|
|
## crontab不同机器上的备份
|
|
|
|
|
|
### 10.8.6.21
|
|
|
```
|
|
|
#工商主体司法标签
|
|
|
5 * * * * bash /home/collie/product/app_company_tag/deploy/company_risk_tag_daily.sh
|
|
|
|
|
|
# baidu_pc
|
|
|
#*/2 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_baidu_pc_task.yml > /dev/null 2>&1
|
|
|
# baiduv
|
|
|
*/1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_baiduv_person_task.yml > /dev/null 2>&1
|
|
|
*/1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_baiduv_company_task.yml > /dev/null 2>&1
|
|
|
# 5118
|
|
|
*/1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_5118_task.yml > /dev/null 2>&1
|
|
|
# adbug提交任务
|
|
|
# */1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_adbug_task.yml > /dev/null 2>&1
|
|
|
# adbug从es获取任务提交
|
|
|
30 0 * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_adbug_task_from_es.yml > /dev/null 2>&1
|
|
|
|
|
|
#7icp 爬虫
|
|
|
*/5 7-19 * * * flock -n /home/collie/product/offset_store/7icp-1.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/7icp.yml --default_config product --assign_attrs province province_part1"
|
|
|
*/5 7-19 * * * flock -n /home/collie/product/offset_store/7icp-2.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/7icp.yml --default_config product --assign_attrs province province_part2"
|
|
|
*/5 7-19 * * * flock -n /home/collie/product/offset_store/7icp-3.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/7icp.yml --default_config product --assign_attrs province province_part3"
|
|
|
|
|
|
|
|
|
#zimi 爬虫
|
|
|
#*/5 7-19 * * * flock -n /home/collie/product/offset_store/zimi-1.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/zimi.yml --default_config product --assign_attrs province province_part1"
|
|
|
#*/5 7-19 * * * flock -n /home/collie/product/offset_store/zimi-2.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/zimi.yml --default_config product --assign_attrs province province_part2"
|
|
|
#*/5 7-19 * * * flock -n /home/collie/product/offset_store/zimi-3.lock -c "/home/collie/.conda/envs/collie/bin/python product/app_icp/jobs/data_pump/data_pump.py pump-data --config product/app_icp/data_pump/zimi.yml --default_config product --assign_attrs province province_part3"
|
|
|
|
|
|
# baidu_index
|
|
|
*/1 * * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_search_ads/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_search_ads/data_pump/baidu_index.yml --default_config commit_baidu_index_task
|
|
|
|
|
|
(base) [collie@bdp-server-001 yuanb]$ crontab -l | grep baiduv
|
|
|
# baiduv
|
|
|
*/1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_baiduv_person_task.yml > /dev/null 2>&1
|
|
|
*/1 * * * * cd /home/collie/product/app_ad/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data -c ../../data_pump/commit_baiduv_company_task.yml > /dev/null 2>&1
|
|
|
```
|
|
|
|
|
|
### 10.8.6.23
|
|
|
```
|
|
|
# 每天5点30
|
... | ... | @@ -67,6 +104,100 @@ |
|
|
10 10 * * * cd /home/collie && /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_public_company/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_ic/data_pump/general_ic_old.yml --default_config QH
|
|
|
```
|
|
|
|
|
|
### 10.8.6.47
|
|
|
```
|
|
|
####
|
|
|
# {minute} {hour} {day-of-month} {month} {day-of-week} {full-path-to-shell-script}
|
|
|
# minute: 区间为 0 – 59
|
|
|
# hour: 区间为0 – 23
|
|
|
# day-of-month: 区间为1 – 31
|
|
|
# month: 区间为1 – 12. 1 是1月. 12是12月.
|
|
|
# day-of-week: 区间为0 – 7. 周日可以是0或7.
|
|
|
####
|
|
|
|
|
|
# tyc每日例行--工商变更以及关联主体的电话数据推送部署 20201216停止更新:
|
|
|
# 00 01 * * * bash /home/collie/product/app_ic_change_info/deploy/data_pump_push_contact.sh
|
|
|
|
|
|
# tyc每日例行--t_05数据库--招投标
|
|
|
#*/30 * * * * bash /home/collie/product/app_lake/cron/data_pump_tyc_t_05_bid.sh company_bid
|
|
|
|
|
|
# 推送当日新成立企业数据,工作日13点和18点
|
|
|
# 05 13 * * 1,2,3,4,5 bash /home/collie/product/app_ic_change_info/cron/job_one_ftp_hour_13.sh
|
|
|
# 05 18 * * 1,2,3,4,5 bash /home/collie/product/app_ic_change_info/cron/job_one_ftp_hour_18.sh
|
|
|
|
|
|
# 西藏商品爬虫入库(部署为supervisor,不用cron)
|
|
|
# 00 06 2,16 * * bash /home/collie/product/app_spider_result/deploy/data_pump_spider_goods.sh
|
|
|
|
|
|
# 对外输出的新成立企业
|
|
|
#*/5 * * * * cd /home/collie/product/app_ic_new/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/all_sync_output.yml
|
|
|
|
|
|
# 新成立企业上线监控
|
|
|
10 9-20 * * * cd /home/collie/product/app_ic_new/monitor_new && /home/collie/.conda/envs/collie/bin/python monitor_ic.py
|
|
|
|
|
|
# 未上线新成立企业提交
|
|
|
10 8,10,15 * * * cd /home/collie/product/app_ic_new/jobs/data_pump/ && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/all_table_crawler_online.yml --default_config old_fail &
|
|
|
|
|
|
# spider--1688_shops(每周二爬一遍所有的店铺)
|
|
|
# 00 09 * * 2 bash /home/collie/product/app_1688/data_pump/spider_job.sh 1688_shops 1>/dev/null
|
|
|
|
|
|
# icp每日例行导出--奇虎
|
|
|
00 01 * * * bash /home/collie/product/app_icp/deploy/icp_data_export_day.sh
|
|
|
# icp每日例行导出--搜狗
|
|
|
05 * * * * bash /home/collie/product/app_icp/deploy/icp_data_export_hour.sh
|
|
|
|
|
|
# 工商api查不到的搜索词提交爬虫
|
|
|
10 * * * * cd /home/collie/product/app_ic_complement/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/api_not_result_keyword.yml
|
|
|
40 * * * * cd /home/collie/product/app_ic_complement/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/api_not_result_keyword.yml --default_config zongju_pc
|
|
|
|
|
|
#国网任务提交
|
|
|
#00 10 * * * /home/collie/.conda/envs/collie/bin/ansible-playbook -i product/app_sgcc/ansible/hosts.ini product/app_sgcc/ansible/sgcc_kill.yaml product/app_sgcc/ansible/sgcc_run.yaml
|
|
|
#30 10 * * * /home/collie/.conda/envs/collie/bin/python product/app_sgcc/jobs/data_pump/data_pump.py pump-data -c product/app_sgcc/data_pump/submit_task.yml --default_config product_submit_task
|
|
|
#00 16 * * * /home/collie/.conda/envs/collie/bin/python product/app_sgcc/jobs/data_pump/data_pump.py pump-data -c product/app_sgcc/data_pump/submit_task.yml --default_config product_submit_task_fail
|
|
|
|
|
|
|
|
|
#搜索广告相关
|
|
|
#获取1小时内变化的企业,提交更新统计信息
|
|
|
0 * * * * /home/collie/.conda/envs/collie/bin/python product/app_search_ads/jobs/data_pump/data_pump.py pump-data --config product/app_search_ads/data_pump/adsearch_v2.yml --default_config get_changed_companies
|
|
|
#45 * * * * /home/collie/.conda/envs/collie/bin/python product/app_search_ads/jobs/data_pump/data_pump.py pump-data --config product/app_search_ads/data_pump/adsearch_v2.yml --default_config get_changed_words
|
|
|
|
|
|
#电商数据准备,每隔2小时执行一次
|
|
|
0 */2 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_eb_app/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_eb_app/data_pump/conv_ebusiness_data.yml --default_config 'conv'
|
|
|
#APP数据准备
|
|
|
#小米APP数据,每月15号2点执行一次
|
|
|
0 2 15 * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_eb_app/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_eb_app/data_pump/conv_app_data.yml --default_config 'xiaomi'
|
|
|
#华为APP数据,每月15号2点执行一次
|
|
|
0 2 15 * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_eb_app/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_eb_app/data_pump/conv_app_data.yml --default_config 'huawei'
|
|
|
|
|
|
# 法院公告数据写文件
|
|
|
05 01 * * * cd /home/collie/product/app_court_notice/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/app_parse_court_notice.yml > court_notice_parse.log 2>&1 &
|
|
|
# 法院公告数据文件入库
|
|
|
05 03 * * * cd /home/collie/product/app_risk/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/risk_court_spider.yml --default_config spider_court_notices_re_to_mysql > court_notice_db.log 2>&1
|
|
|
# 法院公告数据初始解析预警
|
|
|
05 05 * * * bash /home/collie/product/app_risk/deploy/risk_court_notice_warning.sh
|
|
|
# 法院公告数据初始5个json格式网站入库
|
|
|
05 06 * * * cd /home/collie/product/app_risk/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/risk_court_spider.yml --default_config spider_court_notices_re_to_sd_json_web > court_notice_5_json_web.log 2>&1
|
|
|
# 法院公告非json格式网站入库
|
|
|
05 07 * * * cd /home/collie/product/app_risk/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/risk_court_spider.yml --default_config spider_court_notices_re_to_sd_not_json_web > court_notice_not_json_web.log 2>&1
|
|
|
# 开庭公告的网站入库
|
|
|
05 07 * * * cd /home/collie/product/app_risk/jobs/data_pump && /home/collie/.conda/envs/collie/bin/python data_pump.py pump-data --config ../../data_pump/risk_court_spider.yml --default_config spider_court_announcement_re_to_sd > court_announcement.log 2>&1
|
|
|
|
|
|
50 15 * * * bash /home/collie/product/app_mongo_renovate/deploy/renovate_error_credit_no.sh
|
|
|
|
|
|
# 裁判文书数据解析
|
|
|
10 0 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_conv_file/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_conv_file/data_pump/wenshu_conv_file.yml >> /home/collie/product/app_conv_file/data_pump/app_conv_file.log 2>&1
|
|
|
|
|
|
# PDD相似商品数据入库
|
|
|
10 2 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_conv_ebusiness/jobs/data_pump/data_pump.py pump-data --config /home/collie/product/app_conv_ebusiness/data_pump/conv_pdd_reco_goods.yml >> /home/collie/product/app_conv_ebusiness/data_pump/conv_pdd_reco_goods.log 2>&1 &
|
|
|
|
|
|
|
|
|
# 司法拍卖解析
|
|
|
55 09 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_tb_judicial_sale/jobs/data_pump/data_pump.py pump-data -c /home/collie/product/app_tb_judicial_sale/data_pump/parse_data.yml
|
|
|
55 09 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_tb_judicial_sale/jobs/data_pump/data_pump.py pump-data -c /home/collie/product/app_tb_judicial_sale/data_pump/parse_add_time.yml
|
|
|
|
|
|
#增量数据同步情况监控
|
|
|
0 1 * * * /home/collie/.conda/envs/collie/bin/python /home/collie/product/app_maxwell/jobs/data_pump/data_pump.py pump-data -c /home/collie/product/app_maxwell/data_pump/update_data_monitor/update_data_monitor.yml
|
|
|
```
|
|
|
|
|
|
### 10.8.6.63
|
|
|
```
|
|
|
#国网任务提交
|
... | ... | |