Compare commits
No commits in common. "3f774a9e38c002488611d1760fd18a1d46a4ef5f" and "7a131ebd0340078aaaa557f4b35e8b34e081c19a" have entirely different histories.
3f774a9e38
...
7a131ebd03
|
@ -33,10 +33,10 @@ def feed():
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
raise
|
raise
|
||||||
except PRAWException as e:
|
except PRAWException as e:
|
||||||
logging.critical('Problem hitting reddit API: {}'.format(str(e)))
|
logging.error('Problem hitting reddit API: {}'.format(str(e)))
|
||||||
return []
|
return []
|
||||||
except PrawcoreException as e:
|
except PrawcoreException as e:
|
||||||
logging.critical('Problem hitting reddit API: {}'.format(str(e)))
|
logging.error('Problem hitting reddit API: {}'.format(str(e)))
|
||||||
return []
|
return []
|
||||||
|
|
||||||
def comment(i):
|
def comment(i):
|
||||||
|
@ -84,10 +84,10 @@ def story(ref):
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
raise
|
raise
|
||||||
except PRAWException as e:
|
except PRAWException as e:
|
||||||
logging.critical('Problem hitting reddit API: {}'.format(str(e)))
|
logging.error('Problem hitting reddit API: {}'.format(str(e)))
|
||||||
return False
|
return False
|
||||||
except PrawcoreException as e:
|
except PrawcoreException as e:
|
||||||
logging.critical('Problem hitting reddit API: {}'.format(str(e)))
|
logging.error('Problem hitting reddit API: {}'.format(str(e)))
|
||||||
return False
|
return False
|
||||||
|
|
||||||
# scratchpad so I can quickly develop the parser
|
# scratchpad so I can quickly develop the parser
|
||||||
|
|
|
@ -34,7 +34,7 @@ def api(route):
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
raise
|
raise
|
||||||
except BaseException as e:
|
except BaseException as e:
|
||||||
logging.critical('Problem hitting tildes website: {}'.format(str(e)))
|
logging.error('Problem hitting tildes website: {}'.format(str(e)))
|
||||||
return False
|
return False
|
||||||
|
|
||||||
def feed():
|
def feed():
|
||||||
|
@ -113,7 +113,7 @@ def story(ref):
|
||||||
|
|
||||||
# scratchpad so I can quickly develop the parser
|
# scratchpad so I can quickly develop the parser
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
print(feed())
|
#print(feed())
|
||||||
#normal = story('gxt')
|
#normal = story('gxt')
|
||||||
#print(normal)
|
#print(normal)
|
||||||
#no_comments = story('gxr')
|
#no_comments = story('gxr')
|
||||||
|
@ -122,8 +122,8 @@ if __name__ == '__main__':
|
||||||
#print(self_post)
|
#print(self_post)
|
||||||
#li_comment = story('gqx')
|
#li_comment = story('gqx')
|
||||||
#print(li_comment)
|
#print(li_comment)
|
||||||
#broken = story('q4y')
|
broken = story('q4y')
|
||||||
#print(broken)
|
print(broken)
|
||||||
|
|
||||||
# make sure there's no self-reference
|
# make sure there's no self-reference
|
||||||
#import copy
|
#import copy
|
||||||
|
|
|
@ -1,45 +0,0 @@
|
||||||
import logging
|
|
||||||
logging.basicConfig(
|
|
||||||
format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
|
|
||||||
level=logging.INFO)
|
|
||||||
|
|
||||||
import database
|
|
||||||
from sqlalchemy import select
|
|
||||||
import search
|
|
||||||
import sys
|
|
||||||
|
|
||||||
import json
|
|
||||||
import requests
|
|
||||||
|
|
||||||
database.init()
|
|
||||||
search.init()
|
|
||||||
|
|
||||||
def count_stories():
|
|
||||||
try:
|
|
||||||
session = database.Session()
|
|
||||||
return session.query(database.Story).count()
|
|
||||||
finally:
|
|
||||||
session.close()
|
|
||||||
|
|
||||||
def get_story_list():
|
|
||||||
try:
|
|
||||||
session = database.Session()
|
|
||||||
return session.query(database.Story.sid).all()
|
|
||||||
finally:
|
|
||||||
session.close()
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
|
||||||
num_stories = count_stories()
|
|
||||||
|
|
||||||
print('Reindex {} stories?'.format(num_stories))
|
|
||||||
print('Press ENTER to continue, ctrl-c to cancel')
|
|
||||||
input()
|
|
||||||
|
|
||||||
count = 1
|
|
||||||
for sid in get_story_list():
|
|
||||||
story = database.get_story(sid)
|
|
||||||
print('Indexing {}/{} id: {} title: {}'.format(count, num_stories, sid[0], story.title))
|
|
||||||
story_obj = json.loads(story.meta_json)
|
|
||||||
search.put_story(story_obj)
|
|
||||||
count += 1
|
|
||||||
|
|
|
@ -7,34 +7,51 @@ import requests
|
||||||
|
|
||||||
MEILI_URL = 'http://127.0.0.1:7700/'
|
MEILI_URL = 'http://127.0.0.1:7700/'
|
||||||
|
|
||||||
def meili_api(method, route, json=None, params=None):
|
def create_index():
|
||||||
try:
|
try:
|
||||||
r = method(MEILI_URL + route, json=json, params=params, timeout=4)
|
json = dict(name='qotnews', uid='qotnews')
|
||||||
if r.status_code > 299:
|
r = requests.post(MEILI_URL + 'indexes', json=json, timeout=2)
|
||||||
|
if r.status_code != 201:
|
||||||
raise Exception('Bad response code ' + str(r.status_code))
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
return r.json()
|
return r.json()
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
raise
|
raise
|
||||||
except BaseException as e:
|
except BaseException as e:
|
||||||
logging.error('Problem with MeiliSearch api route: %s: %s', route, str(e))
|
logging.error('Problem creating MeiliSearch index: {}'.format(str(e)))
|
||||||
return False
|
return False
|
||||||
|
|
||||||
def create_index():
|
|
||||||
json = dict(uid='qotnews', primaryKey='id')
|
|
||||||
return meili_api(requests.post, 'indexes', json=json)
|
|
||||||
|
|
||||||
def update_rankings():
|
def update_rankings():
|
||||||
json = ['typo', 'words', 'proximity', 'attribute', 'desc(date)', 'wordsPosition', 'exactness']
|
try:
|
||||||
return meili_api(requests.post, 'indexes/qotnews/settings/ranking-rules', json=json)
|
json = ['typo', 'words', 'proximity', 'attribute', 'desc(date)', 'wordsPosition', 'exactness']
|
||||||
|
r = requests.post(MEILI_URL + 'indexes/qotnews/settings/ranking-rules', json=json, timeout=2)
|
||||||
|
if r.status_code != 202:
|
||||||
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
|
return r.json()
|
||||||
|
except KeyboardInterrupt:
|
||||||
|
raise
|
||||||
|
except BaseException as e:
|
||||||
|
logging.error('Problem setting MeiliSearch ranking rules: {}'.format(str(e)))
|
||||||
|
return False
|
||||||
|
|
||||||
def update_attributes():
|
def update_attributes():
|
||||||
json = ['title', 'url', 'author', 'link', 'id']
|
try:
|
||||||
r = meili_api(requests.post, 'indexes/qotnews/settings/searchable-attributes', json=json)
|
json = ['title', 'url', 'author', 'link', 'id']
|
||||||
meili_api(requests.delete, 'indexes/qotnews/settings/displayed-attributes', json=json)
|
r = requests.post(MEILI_URL + 'indexes/qotnews/settings/searchable-attributes', json=json, timeout=2)
|
||||||
return r
|
if r.status_code != 202:
|
||||||
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
|
return r.json()
|
||||||
|
r = requests.delete(MEILI_URL + 'indexes/qotnews/settings/displayed-attributes', timeout=2)
|
||||||
|
if r.status_code != 202:
|
||||||
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
|
return r.json()
|
||||||
|
except KeyboardInterrupt:
|
||||||
|
raise
|
||||||
|
except BaseException as e:
|
||||||
|
logging.error('Problem setting MeiliSearch searchable attributes: {}'.format(str(e)))
|
||||||
|
return False
|
||||||
|
|
||||||
def init():
|
def init():
|
||||||
print(create_index())
|
create_index()
|
||||||
update_rankings()
|
update_rankings()
|
||||||
update_attributes()
|
update_attributes()
|
||||||
|
|
||||||
|
@ -42,14 +59,31 @@ def put_story(story):
|
||||||
story = story.copy()
|
story = story.copy()
|
||||||
story.pop('text', None)
|
story.pop('text', None)
|
||||||
story.pop('comments', None)
|
story.pop('comments', None)
|
||||||
return meili_api(requests.post, 'indexes/qotnews/documents', [story])
|
try:
|
||||||
|
r = requests.post(MEILI_URL + 'indexes/qotnews/documents', json=[story], timeout=2)
|
||||||
|
if r.status_code != 202:
|
||||||
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
|
return r.json()
|
||||||
|
except KeyboardInterrupt:
|
||||||
|
raise
|
||||||
|
except BaseException as e:
|
||||||
|
logging.error('Problem putting MeiliSearch story: {}'.format(str(e)))
|
||||||
|
return False
|
||||||
|
|
||||||
def search(q):
|
def search(q):
|
||||||
params = dict(q=q, limit=250)
|
try:
|
||||||
r = meili_api(requests.get, 'indexes/qotnews/search', params=params)
|
params = dict(q=q, limit=250)
|
||||||
return r['hits']
|
r = requests.get(MEILI_URL + 'indexes/qotnews/search', params=params, timeout=2)
|
||||||
|
if r.status_code != 200:
|
||||||
|
raise Exception('Bad response code ' + str(r.status_code))
|
||||||
|
return r.json()['hits']
|
||||||
|
except KeyboardInterrupt:
|
||||||
|
raise
|
||||||
|
except BaseException as e:
|
||||||
|
logging.error('Problem searching MeiliSearch: {}'.format(str(e)))
|
||||||
|
return False
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
init()
|
create_index()
|
||||||
|
|
||||||
print(search('qot'))
|
print(search('the'))
|
||||||
|
|
|
@ -65,8 +65,6 @@ def submit():
|
||||||
url = request.form['url']
|
url = request.form['url']
|
||||||
nid = new_id()
|
nid = new_id()
|
||||||
|
|
||||||
logging.info('Manual submission: ' + url)
|
|
||||||
|
|
||||||
parse = urlparse(url)
|
parse = urlparse(url)
|
||||||
if 'news.ycombinator.com' in parse.hostname:
|
if 'news.ycombinator.com' in parse.hostname:
|
||||||
source = 'hackernews'
|
source = 'hackernews'
|
||||||
|
@ -202,7 +200,7 @@ def feed_thread():
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
logging.info('Ending feed thread...')
|
logging.info('Ending feed thread...')
|
||||||
except ValueError as e:
|
except ValueError as e:
|
||||||
logging.critical('feed_thread error: {} {}'.format(e.__class__.__name__, e))
|
logging.error('feed_thread error: {} {}'.format(e.__class__.__name__, e))
|
||||||
http_server.stop()
|
http_server.stop()
|
||||||
|
|
||||||
print('Starting Feed thread...')
|
print('Starting Feed thread...')
|
||||||
|
|
|
@ -3,7 +3,7 @@
|
||||||
Download MeiliSearch with:
|
Download MeiliSearch with:
|
||||||
|
|
||||||
```
|
```
|
||||||
wget https://github.com/meilisearch/MeiliSearch/releases/download/v0.21.1/meilisearch-linux-amd64
|
wget https://github.com/meilisearch/MeiliSearch/releases/download/v0.11.1/meilisearch-linux-amd64
|
||||||
chmod +x meilisearch-linux-amd64
|
chmod +x meilisearch-linux-amd64
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user