機械学習を用いて株価の上昇と下落を予測する(ツール類、ワンタッチ呼び出し付)

5527 ワード

1、前置き準備
データソースはtushare proを使用して、具体的な操作はリンクを見てください、登録はTushare金融ビッグデータオープンコミュニティを使用することができます
2、直接ソースコード
パッケージができていないので、コードを繰り返して、間に合わせてみましょう.pythonはあまりできません.
# -*- coding: utf-8 -*-
import datetime
import os
import time

import numpy as np
import tushare as ts
from sklearn import svm
import joblib


class SvmUtil(object):

    def __init__(self):
        self.pro = ts.pro_api('   tushare token')

    def svm_learning(self, stockCode):
        end_time = time.strftime('%Y%m%d', time.localtime(time.time()))
        start_year = int(time.strftime('%Y', time.localtime(time.time()))) - 2
        month_day = time.strftime('%m%d', time.localtime(time.time()))
        start_time = '{}{}'.format(start_year, month_day)
        #     
        df = self.pro.daily(ts_code=stockCode, start_date=start_time, end_date=end_time)

        days_value = df['trade_date'].values[::-1]
        days_close = df['close'].values[::-1]
        days = []
        #         
        for i in range(len(days_value)):
            days.append(str(days_value[i]))

        x_all = []
        y_all = []
        for index in range(15, (len(days) - 5)):
            #       15        
            start_day = days[index - 15]
            end_day = days[index]
            data = self.pro.daily(ts_code=stockCode, start_date=start_day, end_date=end_day)
            open = data['open'].values[::-1]
            close = data['close'].values[::-1]
            max_x = data['high'].values[::-1]
            min_n = data['low'].values[::-1]
            amount = data['amount'].values[::-1]
            volume = []
            for i in range(len(close)):
                volume_temp = amount[i] / close[i]
                volume.append(volume_temp)

            open_mean = open[-1] / np.mean(open)  #    /  
            close_mean = close[-1] / np.mean(close)  #    /  
            diff_close_open_mean = close_mean - open_mean  #      -     
            volume_mean = volume[-1] / np.mean(volume)  #   /  
            max_mean = max_x[-1] / np.mean(max_x)  #    /  
            min_mean = min_n[-1] / np.mean(min_n)  #    /  
            diff_max_min_mean = max_mean - min_mean  #      -     
            vol = volume[-1]
            return_now = close[-1] / close[0]  #      
            std = np.std(np.array(close), axis=0)  #      

            #              X
            # features      
            # features = [close_mean, volume_mean, max_mean, min_mean, vol, return_now, std]
            features = [open_mean, close_mean, diff_close_open_mean, volume_mean, max_mean, min_mean, diff_max_min_mean,
                        vol, return_now, std]
            x_all.append(features)

        #            
        for i in range(len(days_close) - 20):
            if days_close[i + 20] > days_close[i + 15]:
                label = 1
            else:
                label = 0
            y_all.append(label)

        x_train = x_all[: -1]
        y_train = y_all[: -1]
        #   SVM
        model = svm.SVC(C=1.0, kernel='rbf', degree=3, gamma='auto', coef0=0.0, shrinking=True, probability=False,
                        tol=0.001, cache_size=400, verbose=False, max_iter=-1,
                        decision_function_shape='ovr', random_state=None)
        model.fit(x_train, y_train)
        joblib.dump(model, stockCode[:-3] + "_model.m")

    def svm_predict(self, stockCode):
        if not (os.path.exists(stockCode[:-3] + "_model.m")):
            self.svm_learning(stockCode)
        today = datetime.date.today()
        first = today.replace(day=1)
        last_month = first - datetime.timedelta(days=15)
        start_time = last_month.strftime("%Y%m%d")
        end_time = time.strftime('%Y%m%d', time.localtime(time.time()))
        model = joblib.load(stockCode[:-3] + "_model.m")
        df = self.pro.daily(ts_code=stockCode, start_date=start_time, end_date=end_time)
        open = df['open'].values[::-1]
        close = df['close'].values[::-1]
        train_max_x = df['high'].values[::-1]
        train_min_n = df['low'].values[::-1]
        train_amount = df['amount'].values[::-1]
        volume = []
        for i in range(len(close)):
            volume_temp = train_amount[i] / close[i]
            volume.append(volume_temp)

        open_mean = open[-1] / np.mean(open)
        close_mean = close[-1] / np.mean(close)
        diff_close_open_mean = close_mean - open_mean
        volume_mean = volume[-1] / np.mean(volume)
        max_mean = train_max_x[-1] / np.mean(train_max_x)
        min_mean = train_min_n[-1] / np.mean(train_min_n)
        diff_max_min_mean = max_mean - min_mean
        vol = volume[-1]
        return_now = close[-1] / close[0]
        std = np.std(np.array(close), axis=0)

        #            
        # features = [close_mean, volume_mean, max_mean, min_mean, vol, return_now, std]
        features = [open_mean, close_mean, diff_close_open_mean, volume_mean, max_mean, min_mean, diff_max_min_mean,
                    vol, return_now, std]
        features = np.array(features).reshape(1, -1)
        prediction = model.predict(features)[0]
        return prediction


if __name__ == '__main__':
    code = '002277.SZ'
    # SvmUtil().svm_learning(code)
    SvmUtil().svm_predict(code)

本文はブログの1文の多発プラットフォームOpenWriteから発表します!