2017-04-04 20:12:45 +02:00
import praw
2022-04-04 17:49:57 +01:00
import json
2022-04-05 11:55:45 +01:00
import time
2022-04-08 11:19:46 +07:00
import re
2022-04-06 16:47:46 -03:00
import os
2022-04-08 06:52:00 +07:00
import traceback
2022-04-08 11:19:46 +07:00
from formatter import format_all
2017-04-04 20:12:45 +02:00
2022-04-05 14:15:30 +03:00
outfile = open ( ' temp_atlas.json ' , ' w ' , encoding = ' utf-8 ' )
2022-04-10 21:34:06 +07:00
editidsfile = open ( ' read-ids-temp.txt ' , ' w ' )
2022-04-05 14:15:30 +03:00
failfile = open ( ' manual_atlas.json ' , ' w ' , encoding = ' utf-8 ' )
2017-04-04 20:12:45 +02:00
2022-04-08 10:59:06 +07:00
with open ( ' credentials ' , ' r ' ) as file :
credentials = file . readlines ( )
client_id = credentials [ 0 ] . strip ( )
client_secret = credentials [ 1 ] . strip ( )
2022-04-08 22:57:33 +07:00
username = credentials [ 2 ] . strip ( ) if len ( credentials ) > 3 else " "
password = credentials [ 3 ] . strip ( ) if len ( credentials ) > 3 else " "
2022-04-08 10:59:06 +07:00
reddit = praw . Reddit (
client_id = client_id ,
client_secret = client_secret ,
username = username ,
password = password ,
user_agent = ' atlas_bot '
)
has_write_access = not reddit . read_only
if not has_write_access :
print ( " Warning: No write access. Post flairs will not be updated. " )
time . sleep ( 5 )
2022-04-07 12:01:09 +07:00
2022-04-05 11:25:12 +01:00
existing_ids = [ ]
2022-04-10 21:34:06 +07:00
with open ( ' ../data/edit-ids.txt ' , ' r ' ) as edit_ids_file :
for id in [ x . strip ( ) for x in edit_ids_file . readlines ( ) ] :
existing_ids . append ( id )
2022-04-05 11:25:12 +01:00
2022-04-08 10:59:06 +07:00
def set_flair ( submission , flair ) :
if has_write_access and submission . link_flair_text != flair :
flair_choices = submission . flair . choices ( )
flair = next ( x for x in flair_choices if x [ " flair_text_editable " ] and flair == x [ " flair_text " ] )
submission . flair . select ( flair [ " flair_template_id " ] )
2022-04-06 16:47:46 -03:00
total_all_flairs = 0
duplicate_count = 0
2022-04-08 11:19:46 +07:00
failcount = 0
successcount = 0
totalcount = 0
2022-04-06 16:47:46 -03:00
outfile . write ( " [ \n " )
2022-04-05 20:57:08 +01:00
for submission in reddit . subreddit ( ' placeAtlas2 ' ) . new ( limit = 2000 ) :
2022-04-04 19:02:15 +01:00
"""
Auth setup
1. Head to https : / / www . reddit . com / prefs / apps
2. Click " create another app "
3. Give it a name and description
4. Select " script "
5. Redirect to http : / / localhost : 8080
2022-04-08 11:09:35 +07:00
6. Create file " credentials " with the format below .
┌ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ┐
│ [ ID ] < - Under " personal use script " │
│ [ Secret ] │
│ [ Username ] < - Must be a mod , don ' t do this if you │
│ [ Password ] < - don ' t know what you are doing. │
└ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ─ ┘
7. Run Script
2022-04-04 19:02:15 +01:00
Running Script
1. Input the next ID to use
2. Manually resolve errors in manual_atlas . json
3. Copy temp_atlas . json entries into web / _js / atlas . js
4. Pull Request
"""
2022-04-06 16:47:46 -03:00
total_all_flairs + = 1
2022-04-07 12:01:09 +07:00
2022-04-05 11:55:45 +01:00
if ( submission . id in existing_ids ) :
2022-04-08 11:19:46 +07:00
set_flair ( submission , " Processed Entry " )
2022-04-05 13:47:36 +01:00
print ( " Found first duplicate! " )
2022-04-06 16:47:46 -03:00
duplicate_count + = 1
2022-04-08 11:19:46 +07:00
if ( duplicate_count > 0 ) :
2022-04-06 16:47:46 -03:00
break
else :
continue
2022-04-07 12:01:09 +07:00
2022-04-08 10:59:06 +07:00
if ( submission . link_flair_text == " New Entry " ) :
2022-04-07 12:01:09 +07:00
2022-04-05 08:39:51 +01:00
try :
2022-04-07 21:22:41 +07:00
text = submission . selftext
2022-04-08 06:52:00 +07:00
rawtext = text
2022-04-08 11:01:51 +07:00
text = text . replace ( ' \u200c ' , ' ' )
2022-04-08 06:52:00 +07:00
text = re . compile ( r " .*( \ { .+ \ }).* " , re . DOTALL ) . search ( text ) . group ( 1 )
2022-04-08 07:28:20 +07:00
# Test if it needs to escape the escape character. Usually happens on fancy mode.
try : json . loads ( text )
except json . JSONDecodeError : text = re . sub ( r " \\ (.) " , r " \ 1 " , text )
2022-04-08 06:52:00 +07:00
2022-04-07 12:01:09 +07:00
submission_json = json . loads ( text )
2017-04-05 02:53:39 +02:00
2022-04-07 21:22:41 +07:00
if submission_json :
2017-04-05 02:53:39 +02:00
2022-04-07 21:22:41 +07:00
submission_json_dummy = { " id " : submission . id , " submitted_by " : " " }
try :
submission_json_dummy [ " submitted_by " ] = submission . author . name
except AttributeError :
submission_json_dummy [ " submitted_by " ] = " unknown "
for key in submission_json :
if not key in submission_json_dummy :
submission_json_dummy [ key ] = submission_json [ key ] ;
2022-04-08 18:04:49 +07:00
( submission_json , validation_status ) = format_all ( submission_json_dummy , True )
assert validation_status < 3 , \
" Submission invalid after validation. This may be caused by not enough points on the path. "
2022-04-08 21:17:16 +07:00
outfile . write ( json . dumps ( submission_json , ensure_ascii = False ) + " , \n " )
2022-04-10 21:34:06 +07:00
editidsfile . write ( submission . id + ' \n ' )
2022-04-07 21:22:41 +07:00
successcount + = 1
2022-04-08 10:59:06 +07:00
set_flair ( submission , " Processed Entry " )
2022-04-07 21:22:41 +07:00
except Exception as e :
2022-04-08 06:52:00 +07:00
failfile . write (
" \n \n " + " = " * 40 + " \n \n " +
submission . id + " \n \n " +
traceback . format_exc ( ) + " \n \n " +
2022-04-08 10:13:12 +07:00
" ==== RAW ==== " + " \n \n " +
rawtext + " \n \n "
" ==== CLEAN ==== " + " \n \n " +
text + " \n \n "
2022-04-08 06:52:00 +07:00
)
2022-04-07 21:22:41 +07:00
failcount + = 1
2022-04-08 10:59:06 +07:00
set_flair ( submission , " Rejected Entry " )
2022-04-07 12:01:09 +07:00
2022-04-08 10:59:06 +07:00
print ( " Wrote " + submission . id + " , submitted " + str ( round ( time . time ( ) - submission . created_utc ) ) + " seconds ago " )
2022-04-05 22:33:57 -03:00
totalcount + = 1
2022-04-04 17:49:57 +01:00
2022-04-08 10:14:49 +07:00
# Remove last trailing comma
outfile . seek ( outfile . tell ( ) - 3 , os . SEEK_SET )
2022-04-06 16:47:46 -03:00
outfile . truncate ( )
outfile . write ( " \n ] " )
print ( f " \n \n Total all flairs: { total_all_flairs } \n Success: { successcount } / { totalcount } \n Fail: { failcount } / { totalcount } \n Please check manual_atlas.txt for failed entries to manually resolve. " )