第25月第7天聚宽 svm

# 克隆自聚宽文章：https://www.joinquant.com/post/2709

# 标题：基于SVM的机器学习策略

# 作者：走得很慢的海龟

import math
import time
from datetime import datetime
from datetime import timedelta

import cPickle as pickle

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import sklearn
from matplotlib import style
#from sklearn import preprocessing, cross_validation, svm
from sklearn import preprocessing, svm

def initialize(context):
    """Start-up hook: mark the classifier as not yet trained.

    Sets ``g.train`` to True; ``handle_data`` checks this flag and trains
    the model while it is set. ``context`` is not used here.
    """
    g.train = True

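# year_date is the reporting period passed to get_fundamentals(statDate=...), e.g. '2014q1';
# index_date is the date used to look up the index constituents.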

def _close_on_or_before(code, day):
    """Return the daily close of ``code`` on ``day``, else three days earlier.

    ``day`` is a ``datetime``. The three-day step back is the original
    "weekend" fallback for dates with no price bar. Returns NaN when neither
    date yields a bar, so callers keep one value per sample instead of
    crashing on an empty frame.
    """
    for probe in (day, day - timedelta(days=3)):
        stamp = probe.strftime('%Y-%m-%d')
        bars = get_price(code, start_date=stamp, end_date=stamp,
                         frequency='daily', fields='close')
        if not bars.empty:
            # First (only) value of the one-day result, whatever its shape.
            return bars.values.ravel()[0]
    return np.nan


def train_data(year_date, index_date):
    """Build one labelled training frame for a reporting period.

    Args:
        year_date: reporting period forwarded as ``statDate`` to
            ``get_fundamentals`` (the caller passes values such as '2014q1').
        index_date: date used to fetch the constituents of the three indexes
            that make up the stock universe.

    Returns:
        A DataFrame with one row per income-statement record: the income
        columns, the valuation snapshot taken on the publication date
        ('pe', 'pb', 'cir_mkt_cap'), the close at publication ('price'),
        the indicator columns, and 'status'. 'status' is 1 when the close
        30 calendar days after publication is more than 1.1 times the close
        at publication, otherwise 0. Missing prices or valuation snapshots
        are stored as NaN (and then labelled 0) rather than raising.

    NOTE(review): ``query``, ``income``, ``valuation``, ``indicator``,
    ``get_index_stocks``, ``get_fundamentals`` and ``get_price`` are not
    defined in this file; presumably they are injected by the JoinQuant
    runtime. The frames are concatenated positionally, which assumes the
    income and indicator queries return rows in the same order -- confirm.
    """
    universe = (get_index_stocks('399008.XSHE', date=index_date)
                + get_index_stocks('399012.XSHE', date=index_date)
                + get_index_stocks('399905.XSHE', date=index_date))

    income_query = query(
        income.code, income.pubDate, income.total_operating_revenue,
        income.total_operating_cost, income.administration_expense,
        income.operating_profit, income.non_operating_revenue,
        income.total_profit, income.net_profit, income.basic_eps,
        income.diluted_eps, income.total_composite_income
    ).filter(
        valuation.code.in_(universe))
    incm = get_fundamentals(income_query, statDate=year_date)
    pub_dates = incm['pubDate']
    codes = incm['code']

    indicator_query = query(
        indicator
    ).filter(
        valuation.code.in_(codes))
    indictor = get_fundamentals(indicator_query, statDate=year_date)
    del indictor['code'], indictor['statDate'], indictor['pubDate']

    horizon = timedelta(days=30)
    valuations = []
    prices = []
    labels = []
    for code, pub_date in zip(codes, pub_dates):
        valuation_query = query(
            valuation.pe_ratio, valuation.pb_ratio,
            valuation.circulating_market_cap
        ).filter(
            valuation.code == code)
        snapshot = get_fundamentals(valuation_query, date=pub_date)
        if snapshot.empty:
            # Keep the row so every list stays aligned with ``incm``.
            valuations.append([np.nan, np.nan, np.nan])
        else:
            valuations.append(snapshot.iloc[0].tolist())

        # timedelta arithmetic replaces the epoch-seconds round trip, which
        # could land on the wrong calendar day across a DST change.
        announced = datetime.strptime(pub_date, '%Y-%m-%d')
        entry_close = _close_on_or_before(code, announced)
        exit_close = _close_on_or_before(code, announced + horizon)

        prices.append(entry_close)
        # A NaN ratio compares False, so samples with a missing price get 0.
        labels.append(1 if exit_close / entry_close > 1.1 else 0)

    Valuation = pd.DataFrame(valuations, columns=['pe', 'pb', 'cir_mkt_cap'])
    price = pd.DataFrame(prices, columns=['price'])
    status = pd.DataFrame(labels, columns=['status'])

    df = pd.concat([incm, Valuation, price, indictor, status], axis=1)
    # NOTE(review): 'statDate.1' is not created anywhere in this file;
    # presumably get_fundamentals(statDate=...) adds it -- confirm.
    del df['pubDate'], df['statDate.1'], df['code']
    return df

def fundamental(index):
    """Build the scaled feature matrix used for prediction.

    Args:
        index: collection of stock codes to query.

    Returns:
        A tuple ``(X, index2)``: ``X`` is the standardised feature array
        (income columns, valuation columns, latest close, indicator
        columns, in that order) and ``index2`` is the 'code' column of the
        indicator query result, one entry per row of ``X``.

    NOTE(review): the three fundamentals frames are joined positionally,
    which assumes each query returns the same stocks in the same order --
    confirm against the platform's behaviour.
    """
    income_query = query(
        income.total_operating_revenue,
        income.total_operating_cost, income.administration_expense,
        income.operating_profit, income.non_operating_revenue,
        income.total_profit, income.net_profit, income.basic_eps,
        income.diluted_eps, income.total_composite_income
    ).filter(
        valuation.code.in_(index))
    incm = get_fundamentals(income_query)

    valuation_query = query(
        valuation.pe_ratio, valuation.pb_ratio, valuation.circulating_market_cap
    ).filter(
        valuation.code.in_(index))
    Valuation = get_fundamentals(valuation_query)

    indicator_query = query(
        indicator
    ).filter(
        valuation.code.in_(index))
    indictor = get_fundamentals(indicator_query)
    index2 = indictor['code']
    del indictor['code'], indictor['statDate'], indictor['pubDate'], indictor['day']

    closes = []
    for code in index2:
        bar = attribute_history(code, 1, unit='1d', fields=['close'],
                                skip_paused=True)
        # A stock with no usable bar gets NaN instead of raising IndexError.
        closes.append(bar.iloc[0, 0] if not bar.empty else np.nan)
    price = pd.DataFrame(closes, columns=['price'])

    df = pd.concat([incm, Valuation, price, indictor], axis=1)
    # replace('NaN', ...) only matches the literal string on current pandas;
    # fillna covers real missing values so the 9999 sentinel is applied.
    X = np.array(df.replace('NaN', 9999).fillna(9999).values.tolist())
    X = preprocessing.scale(X)
    return X, index2

def handle_data(context, data):
    """Per-bar hook: train once, then trade on the classifier's predictions.

    While ``g.train`` is set, builds the training set from the four 2014
    quarters, fits a linear SVC, pickles it to 'temp.pkl' and clears the
    flag. On every call it reloads the model, scores the current index
    constituents, buys stocks predicted 1 that are not held, sells held
    stocks predicted 0, and finally closes any position whose price is
    above 1.5x or below 0.8x its average cost.

    Args:
        context: platform context; ``current_dt`` and ``portfolio`` are read.
        data: per-bar market data, indexed by stock code.
    """
    model_path = "temp.pkl"

    if g.train:
        # str() wrappers are kept from the original.
        # NOTE(review): presumably a guard against unicode literals -- confirm.
        index_date = str('2014-03-01')
        quarterly = [train_data(str(quarter), index_date)
                     for quarter in ('2014q1', '2014q2', '2014q3', '2014q4')]
        df = pd.concat(quarterly, axis=0)
        # The original discarded the shuffled frame; keep the result.
        df = df.iloc[np.random.permutation(len(df))]
        y = df['status'].values.tolist()
        df = df.drop('status', axis=1)
        log.info("<===== shape of training dataset @ %s", str(df.shape))
        # fillna covers real NaN, which replace('NaN', ...) misses on
        # current pandas.
        X = np.array(df.replace('NaN', 9999).fillna(9999).values.tolist())
        X = preprocessing.scale(X)
        clf = svm.SVC(kernel=str("linear"), C=1.0)
        clf.fit(X, y)
        with open(model_path, 'wb') as model_file:
            pickle.dump(clf, model_file)
        g.train = False

    # The model file is written by this strategy itself; do not point this
    # at a pickle from an untrusted source.
    with open(model_path, 'rb') as model_file:
        clf = pickle.load(model_file)

    index_date = context.current_dt.strftime('%Y-%m-%d')
    SZ1 = get_index_stocks('399008.XSHE', date=index_date)
    SZ2 = get_index_stocks('399012.XSHE', date=index_date)
    SH = get_index_stocks('399905.XSHE', date=index_date)
    index = SZ1 + SZ2 + SH

    X, index2 = fundamental(index)

    # One batch prediction instead of two single-row calls per stock.
    predictions = clf.predict(X) if len(index2) else []
    for code, label in zip(index2, predictions):
        held = code in context.portfolio.positions.keys()
        if label == 1 and not held:
            log.info("===================Buying:", code)
            order_target_value(code, context.portfolio.cash/5)
        elif label == 0 and held:
            log.info("<<<<<<<<<<<<<<<<<<Holding:", context.portfolio.positions.keys())
            log.info("-------------------selling:", code)
            order_target(code, 0)

    # Stop-loss / take-profit. Iterate over a snapshot of the keys in case
    # closing a position changes the mapping.
    for stock in list(context.portfolio.positions.keys()):
        cur_price = data[stock].close
        position = context.portfolio.positions[stock]
        if cur_price > position.avg_cost * (1 + 0.5) or cur_price < position.avg_cost * (1 - 0.2):
            order_target(stock, 0)
            log.info("<<<<<<<<<<<", stock, "%s lose:", 1-cur_price/position.avg_cost)

　　https://www.joinquant.com/

https://zhuanlan.zhihu.com/p/24649311

第25月第7天聚宽 svm的更多相关文章

聚宽投资研究获取A股05年至今全部数据
#用中正全指'000985.XSHG'获取全部A股数据pool=get_index_stocks('000985.XSHG') #date存储05年开始全部交易时间 date=get_price('0 ...
金融量化分析【day113】：聚宽自带策略
一.策略代码 # 导入函数库 from jqdata import * # 初始化函数,设定基准等等 def initialize(context): # 设定沪深300作为基准 set_benchm ...
聚宽获取财务数据+DataFrame写入txt
from jqdata import jy from jqdata import * #获取股票列表,这里是板块内股票 pool=get_industry_stocks(',date='2016-09 ...
第25月第26天 dispatch_group_t dispatch_semaphore_t
1. dispatch_group_enter(group); dispatch_group_leave(group); dispatch_group_notify(group1, queue1,bl ...
第25月25日 urlsession
1. private lazy var session: URLSession = { let configuration = URLSessionConfiguration.default conf ...
第25月第22日 django channels
1. https://github.com/andrewgodwin/channels-examples/ https://channels.readthedocs.io/en/latest/
第25月第18天 vue
1.cnpm sudo chown -R $USER /usr/local npm install -g cnpm --registry=https://registry.npm.taobao.or ...
第25月第17天 django rest framwork authentication /tmp/mysql.sock
1.authentication https://www.django-rest-framework.org/api-guide/authentication/#authentication 2.dj ...
第25月第15天 udacity cs253
1.cs253 https://classroom.udacity.com/courses/cs253 webapp2 Install WebOb, Paste and webapp2¶ We nee ...

随机推荐

zabbix自动发现
zabbix3.4 Discovery自动发现教程 Zabbix 创建发现规则创建发现规则配置 ---- 自动发现 ---- 创建发现规则看一个例子这样发现规则就没有问题了,下面让主机自动加入到某 ...
JAVA版本8u171与8u172的区别
用了java 7好几年了,今天闲来无事,想升级到 java 8,到官网下载的时候发现JAVA放出了8u171与8u172两个版本. 什么情况? 百度一下找到答案:https://blog.csdn.n ...
java 分隔函数split("",-1)的用途
转: java 分隔函数split("",-1)的用途 2017年12月14日 11:37:58 jaryle 阅读数:8517 1.如果字符串最后一位有值,则没有区别, 2. ...
#ifndef HeaderName_h #define HeaderName_h #endif 使用详解(转)
原文:#ifndef HeaderName_h #define HeaderName_h #endif 使用详解想必很多人都看到过头文件中写有:#ifndef HeaderName_h ...
Codeforces Gym 191033 E. Explosion Exploit （记忆化搜索+状压）
E. Explosion Exploit time limit per test 2.0 s memory limit per test 256 MB input standard input out ...
（贪心）nyoj91-阶乘之和
91-阶乘之和内存限制:64MB 时间限制:3000ms 特判: No 通过数:71 提交数:191 难度:3 题目描述: 给你一个非负数整数n,判断n是不是一些数(这些数不允许重复使用,且为正数) ...
Mac 软件专题之：OS X Yosemite 精彩应用软件推荐
目前,很多软件都已经发布了针对Yosemite系统的版本,今天和大家分享专题:「OS X Yosemite 精彩应用」,主要分享适配Yosemite系统全新的扁平化界面和新功能的软件,但要知道未在此专 ...
hdu 2815 Mod Tree (exBSGS)
http://acm.hdu.edu.cn/showproblem.php?pid=2815 //解 K^D ≡ N mod P #include<map> #include<cma ...
python--numpy、pandas
numpy 与 pandas 都是用来对数据进行处理的模块, 前者以array 为主体,后者以 DataFrame 为主体(让我想起了Spark的DataFrame 或RDD) 有说 pandas 是 ...
mysql创建用户与pymsql模块
mysql 创建用户及增删改查创建mysql 用户 with grant option 表示用户不存在自主创建 grant [ select ……,insert ……| all ] on 库名.表名 ...

第25月第7天 聚宽 svm

第25月第7天 聚宽 svm的更多相关文章

随机推荐

热门专题

第25月第7天聚宽 svm

第25月第7天聚宽 svm的更多相关文章