config.py 850 B

123456789101112131415161718192021
  1. #!/usr/bin/env python3
  2. # -*- encoding: utf-8 -*-
  3. # URL与URL描述的对应关系. 这些关系从网站的HTML 的 <a>标签中提取得到
  4. mirror_site_folder = "/data/pub/websites"
  5. ignored_title = {"(更多…)", "trackback", "取消回复", "RSS 2.0", "Prev", "Next", }
  6. domain_mapping = {
  7. "www.taobaodba.com" : "http://taobaodba.ruoguschool.com",
  8. "www.searchtb.com" : "http://searchtb.ruoguschool.com",
  9. "www.tbdata.org" : "http://tbdata.ruoguschool.com",
  10. "www.taobaotest.com" : "http://taobaotest.ruoguschool.com",
  11. "csrd.aliapp.com" : "http://csrd.ruoguschool.com",
  12. "www.alidata.org" : "http://alidata.ruoguschool.com/archives",
  13. "blog.linezing.com" : "http://linezing.ruoguschool.com",
  14. "techshow.ctrip.com" : "http://techshow.ruoguschool.com",
  15. "rdc.taobao.com": "http://rdc.ruoguschool.com",
  16. "lamp.baidu.com": "http://lamp.ruoguschool.com",
  17. }