cleanup
parent
373f3ab661
commit
55484ebf11
@ -1,24 +0,0 @@
|
||||
import config
|
||||
|
||||
db, cursor = config.gen_connection()
|
||||
|
||||
cursor.execute("SELECT DISTINCT username FROM media WHERE user_id IS NULL AND platform = 'instagram';")
|
||||
usernames = [username[0] for username in cursor.fetchall()]
|
||||
|
||||
for username in usernames:
|
||||
print(f"Username: {username}")
|
||||
|
||||
cursor.execute("SELECT DISTINCT user_id FROM media WHERE username = %s AND user_id IS NOT NULL;", [username])
|
||||
possible_user_ids = [user_id for user_id, in cursor.fetchall()]
|
||||
if len(possible_user_ids) == 0:
|
||||
print(f"No user_id found for {username}")
|
||||
continue
|
||||
|
||||
if len(possible_user_ids) > 1:
|
||||
print(f"Multiple user_ids found for {username}: {possible_user_ids}")
|
||||
continue
|
||||
|
||||
user_id = possible_user_ids[0]
|
||||
cursor.execute("UPDATE media SET user_id = %s WHERE username = %s AND user_id IS NULL;", [user_id, username])
|
||||
db.commit()
|
||||
print(f"[{cursor.rowcount}] Updated user_id for {username}")
|
||||
@ -1,41 +0,0 @@
|
||||
import config
|
||||
import requests
|
||||
|
||||
def is_url_accessible(url):
|
||||
try:
|
||||
response = requests.head(url, timeout=5) # HEAD request is usually faster and enough to check availability
|
||||
return response.status_code == 200
|
||||
except requests.RequestException:
|
||||
return False
|
||||
|
||||
media_names = ['mediaUrl', 'mediaPreviewUrl']
|
||||
|
||||
db, cursor = config.gen_connection()
|
||||
|
||||
for media_type in media_names:
|
||||
cursor.execute(f"SELECT id, {media_type} FROM snapchat_stories WHERE {media_type} NOT LIKE 'https://cf-st.sc-cdn.net/d/%' AND status != 'inactive'")
|
||||
|
||||
rows = cursor.fetchall()
|
||||
total = len(rows)
|
||||
count = 0
|
||||
|
||||
for row in rows:
|
||||
count += 1
|
||||
record_id, original_url = row
|
||||
|
||||
media_id = original_url.split('/')[-1]
|
||||
new_url = f'https://cf-st.sc-cdn.net/d/{media_id}'
|
||||
|
||||
if is_url_accessible(new_url):
|
||||
print(f"✅ [{count} / {total}] {new_url} is accessible (converted from {original_url})")
|
||||
|
||||
cursor.execute(f"UPDATE snapchat_stories SET {media_type} = %s, status = 'updated' WHERE id = %s", (new_url, record_id))
|
||||
db.commit()
|
||||
continue
|
||||
|
||||
print(f"❌ [{count} / {total}] {new_url} is NOT accessible (original: {original_url})")
|
||||
cursor.execute("""UPDATE snapchat_stories SET status = 'inactive' WHERE id = %s""", (record_id,))
|
||||
db.commit()
|
||||
|
||||
cursor.close()
|
||||
db.close()
|
||||
@ -1,58 +0,0 @@
|
||||
from uuid import uuid4
|
||||
import uuid
|
||||
import os
|
||||
|
||||
def is_valid_uuid(uuid_to_test, version=4):
|
||||
try:
|
||||
uuid_obj = uuid.UUID(uuid_to_test, version=version)
|
||||
except ValueError:
|
||||
return False
|
||||
|
||||
return str(uuid_obj) == uuid_to_test
|
||||
|
||||
source_dir = 'tiktoks/'
|
||||
processed_dir = 'processed_tiktoks'
|
||||
|
||||
os.makedirs(processed_dir, exist_ok=True)
|
||||
|
||||
users = os.listdir(source_dir)
|
||||
|
||||
for user in users:
|
||||
user_dir = os.path.join(source_dir, user)
|
||||
if not os.path.isdir(user_dir):
|
||||
print(f"Skipping {user}")
|
||||
continue
|
||||
|
||||
for file in os.listdir(user_dir):
|
||||
filename = os.path.splitext(file)[0]
|
||||
filepath = os.path.join(user_dir, file)
|
||||
file_ext = os.path.splitext(file)[1]
|
||||
|
||||
tiktok_id = str(uuid4())
|
||||
username = user
|
||||
|
||||
if is_valid_uuid(filename):
|
||||
title = ''
|
||||
tiktok_id = filename
|
||||
elif 'masstik' in file or 'masstiktok' in file:
|
||||
data = file.split('_')
|
||||
title = filename.split('_')[-1]
|
||||
else:
|
||||
title = filename
|
||||
|
||||
|
||||
print("="*100)
|
||||
title = title.encode('utf-8', 'ignore').decode('utf-8')
|
||||
print(f"Username: {username}\nTitle: {title}")
|
||||
|
||||
new_filename = f"{username}~{title}~{tiktok_id}{file_ext}"
|
||||
new_filepath = os.path.join(processed_dir, username, new_filename)
|
||||
|
||||
os.makedirs(os.path.dirname(new_filepath), exist_ok=True)
|
||||
if not os.path.exists(new_filepath):
|
||||
os.rename(filepath, new_filepath)
|
||||
print(f"Renamed {file} to {new_filepath}")
|
||||
else:
|
||||
print("File with the same name already exists. Renaming aborted.")
|
||||
|
||||
print("="*100)
|
||||
Loading…
Reference in New Issue