mirror of https://github.com/midoks/mdserver-web
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
52 lines
1.7 KiB
52 lines
1.7 KiB
#!/usr/bin/env python
|
|
# coding: utf8
|
|
"""
|
|
从MySQL数据库中读取未索引的资源,更新到Sphinx的实时索引中。
|
|
xiaoxia@xiaoxia.org
|
|
2015.5 created
|
|
"""
|
|
|
|
import time
|
|
import MySQLdb as mdb
|
|
import MySQLdb.cursors
|
|
|
|
SRC_HOST = '127.0.0.1'
|
|
SRC_USER = 'root'
|
|
SRC_PASS = 'root'
|
|
DST_HOST = '127.0.0.1'
|
|
DST_USER = 'root'
|
|
DST_PASS = 'root'
|
|
|
|
src_conn = mdb.connect(SRC_HOST, SRC_USER, SRC_PASS, 'ssbc',
|
|
charset='utf8', cursorclass=MySQLdb.cursors.DictCursor)
|
|
src_curr = src_conn.cursor()
|
|
src_curr.execute('SET NAMES utf8')
|
|
|
|
dst_conn = mdb.connect(DST_HOST, DST_USER, DST_PASS,
|
|
'rt_main', port=9306, charset='utf8')
|
|
dst_curr = dst_conn.cursor()
|
|
dst_curr.execute('SET NAMES utf8')
|
|
|
|
|
|
def work():
|
|
src_curr.execute('SELECT id, name, CRC32(category) AS category, length, UNIX_TIMESTAMP(create_time) AS create_time, ' +
|
|
'UNIX_TIMESTAMP(last_seen) AS last_seen FROM search_hash WHERE tagged=false LIMIT 10000')
|
|
total = src_curr.rowcount
|
|
print 'fetched', total
|
|
for one in src_curr:
|
|
ret = dst_curr.execute('insert into rt_main(id,name,category,length,create_time,last_seen) values(%s,%s,%s,%s,%s,%s)',
|
|
(one['id'], one['name'], one['category'], one['length'], one['create_time'], one['last_seen']))
|
|
if ret:
|
|
src_curr.execute(
|
|
'UPDATE search_hash SET tagged=True WHERE id=%s', (one['id'],))
|
|
print 'Indexed', one['name'].encode('utf8')
|
|
print 'Done!'
|
|
return total
|
|
|
|
if __name__ == '__main__':
|
|
while True:
|
|
if work() == 10000:
|
|
print 'Continue...'
|
|
continue
|
|
print 'Wait 10mins...'
|
|
time.sleep(600)
|
|
|