-
Notifications
You must be signed in to change notification settings - Fork 18
/
Copy pathmigrate.py
58 lines (48 loc) · 1.71 KB
/
migrate.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
import base64
from datetime import timezone
from dateutil import parser
from elasticsearch.client import Elasticsearch
from elasticsearch.helpers import scan
from controller.smartapi import SmartAPI
from utils import decoder, indices
ES_ORIGIN = "http://smart-api.info:9200"
ES_DESTINATION = "http://localhost:9200" # CANNOT CHANGE THIS
def migrate():
for doc in scan(
Elasticsearch(ES_ORIGIN),
query={"query": {"match_all": {}}},
index="smartapi_oas3",
doc_type="api",
):
print(doc["_id"])
if not doc["_source"]["_meta"].get("_archived"):
url = doc["_source"]["_meta"]["url"]
raw = decoder.decompress(base64.urlsafe_b64decode(doc["_source"]["~raw"]))
smartapi = SmartAPI(url)
smartapi.raw = raw
smartapi.date_created = parser.parse(doc["_source"]["_meta"]["timestamp"]).replace(tzinfo=timezone.utc)
smartapi.username = doc["_source"]["_meta"]["github_username"]
smartapi.slug = doc["_source"]["_meta"].get("slug")
smartapi.save()
print()
def update():
for doc in scan(
Elasticsearch(ES_DESTINATION),
query={"query": {"match_all": {}}},
index="smartapi_docs",
scroll="60m",
):
print(doc["_id"])
smartapi = SmartAPI.get(doc["_id"])
print(smartapi.check())
print(smartapi.refresh())
if smartapi.webdoc.status == 299:
smartapi.webdoc._status = 200 # change status not reliable during migration
smartapi.save()
print()
if __name__ == "__main__":
input("Will reset smartapi_docs index. Ctrl-C to cancel.")
indices.reset()
migrate()
indices.refresh()
update()