idl_tv_article_marketing_detail.py 969 B

12345678910111213141516171819202122232425262728293031323334353637
  1. #!/usr/bin/env python
  2. #coding=utf-8
  3. """新剧营销文章链接爬取
  4. """
  5. import os
  6. import sys
  7. from fty_util.common import Mysql, Util
  8. reload(sys)
  9. sys.setdefaultencoding('utf8')
  10. first_day = Util.get_first_date_of_yesterday()
  11. conn = Mysql.createOfflineConn()
  12. sql = """
  13. select count(*) as num from scrapy.scrapy_article
  14. """
  15. row = Mysql.getOne(sql, conn=conn)
  16. if row is not None and row[0] is not None and row[0] > 0:
  17. # 清空数据
  18. sql = """
  19. truncate table idl.tv_article_marketing_detail
  20. """
  21. Mysql.execute(sql, conn=conn)
  22. sql = """
  23. insert into idl.tv_article_marketing_detail (tv_id, tv_name, search_type, media_name, search_restrict_url, scrapy_url, scrapy_title, scrapy_date)
  24. select tv_id, tv_name, search_type, media_name, search_restrict_url, scrapy_url, scrapy_title, date_format(scrapy_date, '%Y-%m-%d') from scrapy.scrapy_article order by id asc
  25. """
  26. Mysql.execute(sql, conn=conn)
  27. Mysql.close(conn)