import os
import sys
sys.path.append('..')
import code_pub.api_sqlite
import time
import urllib.request as urllib2
import urllib
from datetime import datetime
from datetime import timedelta
# Names this file treats as shared module-level state.  A `global` statement
# at module scope has no effect in Python; the lines below only list the names.
# In the visible code `k_ri`, `conn_list` and `conn_k` are never assigned.
global stocks
global g_db_stock
global k_ri
global list_code
global conn_list, conn_k
# Stock descriptors ({"code", "name", "date_time"}) filled by init_db_sqlite().
list_code = []
# Parent of the directory that contains this file.
server_root_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# DDL for the per-stock `stock` table, passed to create_table() in
# init_db_code().  The "teble" spelling is part of the name used elsewhere.
create_teble_sql='''
create table if not exists stock(
[id] integer primary key autoincrement,
[date] datetime,
[open] float,
[high] float,
[low] float,
[close] float,
[volume] float,
[adj_close] float
)
'''
def init_db_sqlite():
    """Open the ``stock_code`` database and load its rows into ``list_code``.

    Each row returned by ``select * from stock`` adds one descriptor built
    from columns 1, 2 and 3 (stored as ``code``, ``name`` and ``date_time``).
    Three hard-coded index descriptors are appended after the database rows.
    The opened handle is kept in the module-level ``stocks`` so the caller
    can close it later.
    """
    global stocks
    stocks = code_pub.api_sqlite.c_create_db(db_name="stock_code")
    stocks.conn_db()

    sql = 'select * from stock'
    print(sql)

    cnt = 0
    for record in stocks.search_info(search_sql=sql):
        list_code.append({"code": record[1], "name": record[2], "date_time": record[3]})
        cnt += 1

    # Market indices are not read from the database; they are always added.
    list_code.extend([
        {"code": "0A0001", "name": "上证指数", "date_time": "1990-12-01"},
        {"code": "399001", "name": "深证指数", "date_time": "1990-12-01"},
        {"code": "399006", "name": "创业板指", "date_time": "1990-12-01"},
    ])
    print("cnt", cnt, type("上证指数"))
def init_db_code(code, date_start):
    """Open (and create if needed) the database for ``code``.

    The handle is stored in the module-level ``g_db_stock``; the caller is
    responsible for closing it.

    Args:
        code: Stock code, used as the database name.
        date_start: Value returned when the ``stock`` table has no rows.

    Returns:
        Column 1 of the row with the highest ``id`` (the ``date`` column of
        the most recently inserted row), or ``date_start`` if the table is
        empty.
    """
    global g_db_stock
    g_db_stock = code_pub.api_sqlite.c_create_db(db_name=code)
    g_db_stock.conn_db()
    g_db_stock.create_table(create_teble_sql)

    sql = 'select * from stock order by id desc limit 1'
    print(sql)

    latest_day = date_start
    cnt = 0
    for cnt, record in enumerate(g_db_stock.search_info(search_sql=sql), start=1):
        print(record, type(record[0]), record[0])
        latest_day = record[1]

    print("day", cnt, latest_day)
    return latest_day
def day_plus(str):
    """Parse a ``YYYY-MM-DD`` string and return it as a ``datetime``.

    Despite the name, no day is added; the parsed value is returned as is.
    Raises ``ValueError`` if the text does not match the format.
    """
    return datetime.strptime(str, "%Y-%m-%d")
def day_str_change(str):
    """Convert a ``YYYY-MM-DD`` date string to the compact ``YYYYMMDD`` form.

    Raises ``ValueError`` if the input does not match ``YYYY-MM-DD``.
    """
    return datetime.strptime(str, "%Y-%m-%d").strftime('%Y%m%d')
'''
def update_ri(code, date, open, high, low, close, volume, adj_close):
print code, date, open, high, low, close, volume, adj_close
k_ri.update({"code": code, "date": date}, {"$setOnInsert":{"open": open, "high": high,
"low": low, "close": close,
"volume": volume,
"adj_close": adj_close}}, upsert = True)
'''
def update_ri(code, date, close, high, low, open, pre_close, change_value, change_quote, turnover_rate,
              volume, turnover, total_market_value, market_capitalization, turnover_number):
    """Insert one daily record into the open per-stock database if it is new.

    The row is written through the module-level ``g_db_stock`` handle.  When a
    row with the same ``date`` already exists nothing is written; when more
    than one exists an error banner is printed.

    Only ``date``, ``open``, ``high``, ``low``, ``close``, ``change_quote`` and
    ``turnover_rate`` are stored; every argument is echoed to stdout.

    NOTE(review): the ``volume`` column receives ``change_quote`` and the
    ``adj_close`` column receives ``turnover_rate``.  This may be deliberate
    reuse of the old table layout or a leftover from an earlier signature;
    confirm before changing, since existing databases already hold data
    written this way.
    NOTE(review): the SQL is assembled with ``%`` formatting and ``date``
    comes from downloaded text; switch to bound parameters if the database
    wrapper supports them.
    """
    print("sql", code, date, close, high, low, open, pre_close, change_value, change_quote, turnover_rate,
          volume, turnover, total_market_value, market_capitalization, turnover_number)

    lookup_sql = 'select * from stock where date = "%s" ' % date
    print(lookup_sql)
    existing = len(list(g_db_stock.search_info(search_sql=lookup_sql)))
    print("cnt", existing, date)

    if existing > 1:
        # Duplicates are only reported, never repaired.
        print("---------------------error-----------------------", date)
        return
    if existing == 1:
        return

    insert_sql = 'insert into stock (date, open, high, low, close, volume, adj_close) values ("%s", %f, %f, %f, %f, %f, %f)' % \
        (date, open, high, low, close, change_quote, turnover_rate)
    print(insert_sql)
    g_db_stock.update_info(update_sql=insert_sql)
def stock_header(code):
    """Build the history-download URL for ``code`` (without a date range).

    A one-character prefix is put in front of the code:

    * ``'0'`` for codes starting with ``60``, ``900`` or ``000001``;
    * ``'1'`` for codes starting with ``399001``, ``399006``, ``000``,
      ``002``, ``300`` or ``200``;
    * no prefix for anything else.

    ``000001`` is tested before the ``000`` group, so it always gets ``'0'``.
    NOTE(review): presumably ``0``/``1`` select the Shanghai/Shenzhen market
    on the quote service — confirm, in particular for ``000001`` and for
    codes that fall through unprefixed (e.g. ``0A0001``).
    """
    base_url = 'http://quotes.money.163.com/service/chddata.html?code='
    zero_prefixed = ('60', '900', '000001')
    one_prefixed = ('399001', '399006', '000', '002', '300', '200')

    if code.startswith(zero_prefixed):
        market_code = '0' + code
    elif code.startswith(one_prefixed):
        market_code = '1' + code
    else:
        market_code = code

    print(code)
    return base_url + market_code
'''
def stock_header(code):
url = 'http://table.finance.yahoo.com/table.csv?s='
t1 = ('60', '900')
t2 = ('000', '002', '300', '200')
t3 = ('399001','399006')
if code.startswith(t1):
str = code + '.ss'
elif code.startswith('000001'):
str = code + '.ss'
elif code.startswith(t3):
str = code + '.sz'
elif code.startswith(t2):
str = code + '.sz'
else:
str = code
print code
url = url + str
return url
'''
def deal_url(str_day, url):
    """Append a ``start``/``end`` date range to ``url``.

    Args:
        str_day: First day to request, as ``YYYY-MM-DD``; an empty string
            means "no range".
        url: Base URL to extend.

    Returns:
        ``url`` unchanged when ``str_day`` is empty; an empty string when
        ``str_day`` is today or later (nothing to download); otherwise
        ``url`` followed by ``&start=YYYYMMDD&end=YYYYMMDD`` with today's
        local date as the end.
    """
    if str_day == "":
        print(url)
        return url

    start = day_plus(str_day).strftime('%Y%m%d')
    today = datetime.now().strftime('%Y%m%d')

    # Fixed-width YYYYMMDD strings order the same way as the dates themselves.
    if start >= today:
        print(start, today)
        return ""

    return url + '&start=' + start + '&end=' + today
def file_to_sql(code, content):
    """Parse downloaded CSV text and store each data row via ``update_ri``.

    The lines are sorted as plain text before processing.  The first sorted
    line is always skipped, and processing stops when the running position
    reaches the last index.
    NOTE(review): this presumably relies on the blank line sorting first and
    the header line sorting last — confirm against real downloads.

    For each remaining line, ``\\r`` is stripped, ``None`` is replaced by
    ``0`` and empty fields become ``0``.  A line that does not yield exactly
    16 fields ends processing.  Field 0 is passed on as the date and fields
    3-15 as floats.  A line whose numbers cannot be parsed is reported and
    skipped without advancing the position counter.

    Args:
        code: Stock code forwarded to ``update_ri``.
        content: Decoded CSV text.
    """
    rows = sorted(content.split('\n'))
    last_index = len(rows) - 1
    position = 0

    for row in rows:
        if position == 0:
            position = 1
            continue
        if position == last_index:
            print("end file", position)
            break

        split_row = row.split(",")
        fields = [
            cell.replace("\r", '').replace('None', '0') or '0'
            for cell in split_row
        ]
        if len(fields) != 16:
            break

        try:
            numbers = [float(value) for value in fields[3:16]]
            update_ri(code, fields[0], *numbers)
        except ValueError:
            print('\033[1;31;40m')
            print(split_row)
            print("--------------------ValueError----------------------------------------------")
            print('\033[0m')
            continue
        position += 1
def get_day(code, url):
    """Download the CSV at ``url`` and store its rows for ``code``.

    An empty ``url`` means the stored data is already up to date; the
    function then returns without touching the network.  The response body is
    decoded as GB18030 and handed to ``file_to_sql``.  HTTP errors,
    unreachable servers and socket-level failures while reading (such as a
    timeout) are reported on stdout and the stock is skipped, so that one bad
    download does not abort the whole run.

    Args:
        code: Stock code forwarded to ``file_to_sql``.
        url: Full download URL, or ``""`` to do nothing.
    """
    print(code, url)
    if "" == url:
        print("---newst---date---------------------------------")
        return

    req_timeout = 500  # seconds
    headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36'}
    req = urllib2.Request(url=url, headers=headers)
    try:
        # The context manager closes the response even if read()/decode() raises.
        with urllib2.urlopen(req, None, req_timeout) as response:
            content = response.read().decode('GB18030')
    except urllib2.HTTPError as e:
        print('\033[1;31;40m')
        print('The server couldn\'t fulfill the request.')
        print('Error code: ', e.code)
        print('Error reason: ', e.reason)
        print('\033[0m')
    except urllib2.URLError as e:
        print('\033[1;31;40m')
        print('We failed to reach a server.')
        print('Reason: ', e.reason)
        print('\033[0m')
    except OSError as e:
        # Raised e.g. by a timeout or connection reset while reading the body;
        # such errors are not wrapped in URLError.
        print('\033[1;31;40m')
        print('Connection failed while reading the response.')
        print('Reason: ', e)
        print('\033[0m')
    else:
        file_to_sql(code, content)
class NoHistory(object):
    """History stand-in whose ``add`` and ``clear`` accept calls and do nothing."""

    def add(self, *a, **k):
        return None

    def clear(self):
        return None
def browser(url):
    """Fetch ``url`` with a ``mechanize`` browser and return the stripped body.

    Args:
        url: Address to open; an empty string means there is nothing to fetch.

    Returns:
        ``""`` when ``url`` is empty or when opening/reading fails, otherwise
        the response body with surrounding whitespace removed.

    NOTE(review): ``mechanize`` is not imported anywhere in the visible file,
    so any call with a non-empty ``url`` raises ``NameError`` unless the name
    is provided elsewhere — confirm, or remove this function if it is unused.
    """
    print(url)
    if "" == url:
        print("---newst---date---------------------------------")
        return ""

    br = mechanize.Browser(history=NoHistory())
    br.set_handle_equiv(True)
    br.set_handle_redirect(True)
    br.set_handle_referer(True)
    br.set_handle_robots(False)
    br.set_handle_refresh(mechanize._http.HTTPRefreshProcessor(), max_time=1)
    br.set_debug_http(True)
    br.set_debug_redirects(True)
    br.set_debug_responses(True)
    br.addheaders = [('User-agent', 'Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.0.1) Gecko/2008071615 Fedora/3.0.1-1.fc9 Firefox/3.0.1')]

    try:
        r = br.open(url)
        content = r.read().strip()
    except Exception:
        # Best effort: report the failure and return an empty body.  Unlike a
        # bare ``except``, this lets KeyboardInterrupt/SystemExit propagate.
        print('\033[1;31;40m')
        print("open err ------------------------------------")
        print('\033[0m')
        return ""
    return content
def get_day_list(code, date_start):
    """Bring the stored daily history of one stock up to date.

    Opens the stock's database, builds the download URL starting from the
    last stored date (or ``date_start`` when the table is empty), downloads
    and stores the rows, then closes the database.

    Args:
        code: Stock code; also used as the database name.
        date_start: ``YYYY-MM-DD`` date used when nothing is stored yet.
    """
    str_day = init_db_code(code, date_start)
    try:
        print(str_day)
        url = stock_header(code)
        print(url)
        url = deal_url(str_day, url)
        get_day(code, url)
    finally:
        # Close the handle even if the download or parsing raises, so a
        # failure does not leak the database connection.
        g_db_stock.close_db()
if __name__ == '__main__':
    # Load the list of stocks, then update each one in turn.
    init_db_sqlite()
    try:
        print(len(list_code))
        for entry in list_code:
            get_day_list(entry["code"], entry["date_time"])
    finally:
        # Close the stock-list database even if an update fails part-way.
        stocks.close_db()