|
@@ -0,0 +1,194 @@
|
|
1
|
+import keras
|
|
2
|
+# -*- encoding:utf-8 -*-
|
|
3
|
+import numpy as np
|
|
4
|
+from keras.models import Sequential
|
|
5
|
+# 优化方法选用Adam(其实可选项有很多,如SGD)
|
|
6
|
+from keras.optimizers import Adam
|
|
7
|
+import random
|
|
8
|
+from keras.models import load_model
|
|
9
|
+from imblearn.over_sampling import RandomOverSampler
|
|
10
|
+from keras.utils import np_utils
|
|
11
|
+# 用于模型初始化,Conv2D模型初始化、Activation激活函数,MaxPooling2D是池化层
|
|
12
|
+# Flatten作用是将多位输入进行一维化
|
|
13
|
+# Dense是全连接层
|
|
14
|
+from keras.layers import Conv2D, Activation, MaxPool2D, Flatten, Dense,Dropout,Input,MaxPooling2D,BatchNormalization,concatenate
|
|
15
|
+from keras import regularizers
|
|
16
|
+from keras.models import Model
|
|
17
|
+from keras.callbacks import EarlyStopping
|
|
18
|
+
|
|
19
|
# Stop training once the monitored metric has not improved for 5 epochs.
early_stopping = EarlyStopping(monitor='accuracy', patience=5, verbose=2)

# Training configuration.
epochs = 68
size = 400000  # rows of training data to read (18W / 60W variants also used)

# Input/output locations (Windows paths on the D: drive).
file_path = 'D:\\data\\quantization\\stock200_18d_train2.log'
file_path1 = 'D:\\data\\quantization\\stock200_18d_test.log'
model_path = '200_18d_mix_6D_ma5_s_seq.h5'

'''
ROC
1大盘涨停 涨停/跌停/创业板涨停跌停
2大盘涨停 涨停/跌停
3beta函数修正
4用两个kernel

'''
|
|
34
|
+
|
|
35
|
def read_data(path, path1=file_path1, train_rows=size, test_rows=30000):
    """Read training and test rows, shuffle, split, and oversample.

    Each line of both files is a Python literal (a list) whose last element
    is the class label.  The combined rows are shuffled, split 85/15 into
    train/test, and the training portion is rebalanced with random
    oversampling.

    Parameters:
        path:       training log file, read for ``train_rows`` lines.
        path1:      test log file, read for ``test_rows`` lines.
        train_rows: number of lines to read from ``path`` (default: module
                    constant ``size`` — keeps old call sites working).
        test_rows:  number of lines to read from ``path1`` (default 30000,
                    same as the previous hard-coded value).

    Returns:
        (X_resampled, y_resampled, test_x, test_y) as numpy arrays.
    """
    lines = []
    # SECURITY: eval() executes arbitrary code from the data files — safe
    # only because these logs are produced locally.  Prefer
    # ast.literal_eval() if the files could ever be untrusted.
    with open(path) as f:
        for _ in range(train_rows):
            lines.append(eval(f.readline().strip()))

    with open(path1) as f:
        for _ in range(test_rows):
            lines.append(eval(f.readline().strip()))

    random.shuffle(lines)
    print('读取数据完毕')

    d = int(0.85 * len(lines))
    length = len(lines[0])

    # NOTE(review): s[:length-2] drops the last TWO columns but only s[-1]
    # is used as the label, so column length-2 is silently discarded —
    # confirm this is intentional.
    train_x = [s[:length - 2] for s in lines[:d]]
    train_y = [s[-1] for s in lines[:d]]
    test_x = [s[:length - 2] for s in lines[d:]]
    test_y = [s[-1] for s in lines[d:]]

    print('转换数据完毕')

    ros = RandomOverSampler(random_state=0)
    # imbalanced-learn renamed fit_sample -> fit_resample (the old name was
    # removed in 0.8); dispatch so the script runs on both old and new
    # versions instead of crashing with AttributeError.
    resample = getattr(ros, 'fit_resample', None) or ros.fit_sample
    X_resampled, y_resampled = resample(np.array(train_x), np.array(train_y))

    print('数据重采样完毕')

    return X_resampled, y_resampled, np.array(test_x), np.array(test_y)
|
|
66
|
+
|
|
67
|
+
|
|
68
|
# Load the dataset and split each row into the two model inputs:
# the first 18*20 columns form an 18x20 single-channel "image" for the
# CNN branch; the remaining columns feed the MLP branch.
train_x, train_y, test_x, test_y = read_data(file_path)

train_x_a = train_x[:, :18 * 20].reshape(train_x.shape[0], 18, 20, 1)
train_x_c = train_x[:, 18 * 20:]
|
|
75
|
+
|
|
76
|
+
|
|
77
|
def create_mlp(dim, regress=False):
    """Build the MLP branch: two 96-unit ReLU dense layers.

    Parameters:
        dim:     number of input features.
        regress: when True, append a single linear output node.

    Returns:
        An uncompiled keras Sequential model.
    """
    layers = [
        Dense(96, input_dim=dim, activation="relu"),
        Dense(96, activation="relu"),
    ]
    # Optional regression head.
    if regress:
        layers.append(Dense(1, activation="linear"))
    return Sequential(layers)
|
|
89
|
+
|
|
90
|
+
|
|
91
|
def create_cnn(width, height, depth, size=48, kernel_size=(5, 6), regress=False, output=24):
    """Build the CNN branch over a (width, height, depth) input.

    Fix: the input shape previously hard-coded a single channel and
    silently ignored the ``depth`` argument; it now honours it.  All
    visible call sites pass depth=1, so their behaviour is unchanged.

    Parameters:
        width, height, depth: input "image" dimensions (channels-last).
        size:        number of convolution filters.
        kernel_size: convolution kernel shape.
        regress:     when True, append a single linear output node.
        output:      width of the fully-connected layers (chosen to match
                     the MLP branch for later concatenation).

    Returns:
        An uncompiled keras functional Model.
    """
    # TensorFlow / channels-last ordering.
    inputShape = (width, height, depth)
    chanDim = -1

    inputs = Input(shape=inputShape)

    # CONV => RELU => BN
    x = Conv2D(size, kernel_size, strides=2, padding="same")(inputs)
    x = Activation("relu")(x)
    x = BatchNormalization(axis=chanDim)(x)

    # Flatten, then FC => RELU => BN => DROPOUT
    x = Flatten()(x)
    x = Dense(output)(x)
    x = Activation("relu")(x)
    x = BatchNormalization(axis=chanDim)(x)
    x = Dropout(0.2)(x)

    # Second FC layer so the branch output width matches the MLP branch.
    x = Dense(output)(x)
    x = Activation("relu")(x)

    # Optional regression head.
    if regress:
        x = Dense(1, activation="linear")(x)

    return Model(inputs, x)
|
|
130
|
+
|
|
131
|
+
|
|
132
|
+# create the MLP and CNN models
|
|
133
|
# Build the two branches: an MLP over the flat features and a CNN over
# the 18x20 "image" features (full-width 3x20 kernel, 96 filters).
mlp = create_mlp(train_x_c.shape[1], regress=False)
cnn_0 = create_cnn(18, 20, 1, kernel_size=(3, 20), size=96, regress=False, output=96)

# Fuse both branch outputs into one feature vector.
merged = concatenate([mlp.output, cnn_0.output])

# Classification head: three wide dense layers (the first L1-regularized),
# ending in a 3-way softmax.
head = Dense(1024, activation="relu", kernel_regularizer=regularizers.l1(0.003))(merged)
head = Dropout(0.2)(head)
head = Dense(1024, activation="relu")(head)
head = Dense(1024, activation="relu")(head)
head = Dense(3, activation="softmax")(head)

# The final model takes the MLP features and the CNN "image" as inputs.
model = Model(inputs=[mlp.input, cnn_0.input], outputs=head)
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+print("Starting training ")
|
|
161
|
+# h = model.fit(train_x, train_y, batch_size=4096*2, epochs=500, shuffle=True)
|
|
162
|
+
|
|
163
|
+# compile the model using mean absolute percentage error as our loss,
|
|
164
|
+# implying that we seek to minimize the absolute percentage difference
|
|
165
|
+# between our price *predictions* and the *actual prices*
|
|
166
|
+opt = Adam(lr=1e-3, decay=1e-3 / 200)
|
|
167
|
+model.compile(loss="categorical_crossentropy", optimizer=opt, metrics=['accuracy'])
|
|
168
|
+
|
|
169
|
+# train the model
|
|
170
|
+print("[INFO] training model...")
|
|
171
|
+model.fit(
|
|
172
|
+ [train_x_c, train_x_a,], train_y,
|
|
173
|
+ # validation_data=([testAttrX, testImagesX], testY),
|
|
174
|
+ # epochs=int(3*train_x_a.shape[0]/1300),
|
|
175
|
+ epochs=epochs,
|
|
176
|
+ batch_size=2048, shuffle=True,
|
|
177
|
+ callbacks=[early_stopping]
|
|
178
|
+)
|
|
179
|
+
|
|
180
|
+model.save(model_path)
|
|
181
|
+
|
|
182
|
# Slice the held-out data exactly like the training data: image-shaped
# columns for the CNN branch, the rest for the MLP branch.
test_img = test_x[:, :18 * 20].reshape(test_x.shape[0], 18, 20, 1)
test_flat = test_x[:, 18 * 20:]

# NOTE: message text is leftover from the house-price tutorial this
# script was adapted from; kept verbatim.
print("[INFO] predicting house prices...")
result = model.evaluate([test_flat, test_img], test_y)

print(result)
print('Test score:', result[0])
print('Test accuracy:', result[1])
|