-
Notifications
You must be signed in to change notification settings - Fork 1
/
queue_tranco.sh
executable file
·46 lines (38 loc) · 1.68 KB
/
queue_tranco.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#!/bin/bash
# INDIR="celery_workers/vv8_worker/vv8_crawler/extensionsSome/"
# INDIR="celery_workers/vv8_worker/vv8_crawler/extracted/"
# INDIR="celery_workers/vv8_worker/vv8_crawler/extensionsDefault129/"
# INDIR="celery_workers/vv8_worker/vv8_crawler/selected_extensions/"
# TODO:
# 1) docker compose down
# 1b) delete some of the stuff, not the DB, not the raw_logs
# sudo rm -rf har/ redis_data/ parsed_logs/ screenshots/ mongo/data/ ./scripts/.vv8.db
# 1c) maybe add the docker remove and the docker stop/start stuff from here: https://github.com/moby/moby/issues/10589#issuecomment-222468296
# 2) docker setup -y -y -160 -y
# 3) requeue next URL (e.g. [2] of list of [12-15])
# INDIR="celery_workers/vv8_worker/vv8_crawler/ALL_EXTENSIONS40k/"
INDIR="celery_workers/vv8_worker/vv8_crawler/ALL_EXTENSIONS1k/" # this is for benign samples (from the wild) -> 528
# INDIR="celery_workers/vv8_worker/vv8_crawler/merged_folder_6_parts/" # this is for malicious samples (v2 from v2-v3) 517
# Start one detached tmux session per index 0..11. Session "queue-<i>" runs
# crawler_queue_tranco.py on INDIR with `-s <i> -e <i+1>` (presumably the
# start/end indices of the slice to queue -- confirm against that script).
# Attach to a running session with: tmux attach -t queue-<i>
for i in {0..11}; do
  first="$i"
  last="$((i + 1))"
  session_name="queue-$i"
  # tmux passes this string to a shell, which parses it a second time, so
  # the arguments are escaped with %q to survive that extra round of
  # word-splitting.
  # The command previously began with `bash python3 ...`: bash then treats
  # "python3" as the name of a shell script, locates the interpreter binary
  # via PATH and aborts with "cannot execute binary file", so the session
  # exited immediately. python3 is now invoked directly.
  printf -v queue_cmd 'python3 crawler_queue_tranco.py -i %q -s %q -e %q' \
    "$INDIR" "$first" "$last"
  tmux new-session -d -s "$session_name" "$queue_cmd"
  # python3 queue.py -i $INDIR -s $first -e $last
done
# first=0
# last=1
# INDIR="celery_workers/vv8_worker/vv8_crawler/ALL_EXTENSIONS40k/"
# # INDIR="celery_workers/vv8_worker/vv8_crawler/out_mal_ext_34/"
# python3 queue.py -i $INDIR -s $first -e $last
# tmux new-session -d -s my_session 'ruby run.rb'
# catapultos:
# restart: unless-stopped
# ports:
# - "8080:8080/tcp"
# - "8081:8081/tcp"
# build:
# context: ./celery_workers
# dockerfile: catapultos.dockerfile
# image: catapultos