blob: 6c97a3cb994274fa8c4137020c1f016993243fc0 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
|
import pandas
import os
import ast
import twint
import requests
def download(url):
    """Download the file at ``url`` into the local ``pics/`` directory.

    The local filename is the last ``/``-separated component of ``url``.

    Args:
        url: HTTP(S) address of the file to fetch.

    Raises:
        requests.HTTPError: if the server answers with a 4xx/5xx status.
        requests.RequestException: on connection failure or timeout.
    """
    filename = url.split("/")[-1]
    # Without a timeout, requests waits indefinitely on a stalled connection.
    r = requests.get(url, allow_redirects=True, timeout=30)
    # Fail loudly instead of saving an error page under an image filename.
    r.raise_for_status()
    # Do not rely on the caller having created the target directory.
    os.makedirs("pics", exist_ok=True)
    with open(os.path.join("pics", filename), "wb") as f:
        f.write(r.content)
# Archive the @AceYuriBot timeline to CSV so that image URLs and their
# source links can be extracted below.
c = twint.Config()
c.Username = "AceYuriBot"
c.Images = True  # presumably restricts the search to image tweets - confirm
c.Store_csv = True
c.Output = "yuribot.csv"
twint.run.Search(c)

# download() writes into this directory, so create it up front.
os.makedirs("pics", exist_ok=True)

df = pandas.read_csv("yuribot.csv")

# The "urls" and "photos" cells are parsed as Python list literals.
# Source link: the first entry of "urls", or None when that list is empty.
parsed_urls = df["urls"].apply(ast.literal_eval)
source = parsed_urls.apply(lambda links: links[0] if links else None)

# First photo URL of every row, parsed once and reused for both the
# filename column and the downloads.
first_photo = df["photos"].apply(lambda cell: ast.literal_eval(cell)[0])
file_location = first_photo.apply(lambda photo_url: os.path.basename(photo_url))

# save to file where bot will pull data from
columns = [source, file_location]
pandas.concat(columns, axis=1).to_csv("files.csv")

# download images
for photo_url in first_photo:
    download(photo_url)
|