diff --git a/couchDB/.gitkeep b/couchDB/.gitkeep
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/couchDB/MapReduce/.gitkeep b/couchDB/MapReduce/.gitkeep
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/couchDB/MapReduce/map.js b/couchDB/MapReduce/map.js
new file mode 100644
--- /dev/null
+++ b/couchDB/MapReduce/map.js
@@ -0,0 +1,38 @@
+function (doc) {
+  // CouchDB map function: for each tweet dated 2020, emit the key
+  // [state, sentiment label, month, stage of month] with value 1, so the
+  // companion `_sum` reduce returns a count per key.
+
+  // Without a string created_at the split() below would throw; skip instead.
+  if (typeof doc.created_at !== 'string') {
+    return;
+  }
+
+  // Only the text before the first space is parsed as the date.
+  var editDate = new Date(doc.created_at.split(" ")[0]);
+  var month = editDate.getMonth() + 1; // getMonth() is zero-based
+  var year = editDate.getFullYear();
+  var date = editDate.getDate();
+
+  // An unparseable date gives NaN here, so those documents are skipped too.
+  if (year !== 2020 || doc.sentiment == null) {
+    return;
+  }
+
+  // Stage of the month: F = days 1-10, M = days 11-20, L = day 21 onwards.
+  // Declared with `var` so it does not become an implicit global.
+  var stage;
+  if (date <= 10) {
+    stage = 'F';
+  } else if (date <= 20) {
+    stage = 'M';
+  } else {
+    stage = 'L';
+  }
+
+  // The sign of the first sentiment element selects the label.
+  var score = doc.sentiment[0];
+  var label = score < 0 ? 'negative' : (score > 0 ? 'positive' : 'neutral');
+
+  emit([doc.state, label, month, stage], 1);
+}
diff --git a/couchDB/MapReduce/reduce.js b/couchDB/MapReduce/reduce.js
new file mode 100644
index 0000000000000000000000000000000000000000..79f412b762355329a84537e489f9185e8a914d2e
--- /dev/null
+++ b/couchDB/MapReduce/reduce.js
@@ -0,0 +1 @@
+_sum
\ No newline at end of file
diff --git a/couchDB/process.py b/couchDB/process.py
new file mode 100644
--- /dev/null
+++ b/couchDB/process.py
@@ -0,0 +1,66 @@
+"""Extract id, date, time, polarity and language from line-delimited tweets.
+
+Reads ``tweetsWA.json`` (one JSON document per line) and writes one JSON
+object per line, each followed by a comma, to ``extractedWA.json``.
+"""
+import io
+import json
+from datetime import datetime
+import re
+import sys
+
+from textblob import TextBlob
+
+
+INPUT_PATH = 'tweetsWA.json'
+OUTPUT_PATH = 'extractedWA.json'
+
+# Matches "+", one or more digits and one whitespace character, i.e. the
+# "+0000 "-style field of created_at.  A raw string keeps the escapes literal.
+OFFSET_PATTERN = re.compile(r"\+\d+\s")
+
+
+def parse_created_at(value):
+    """Return *value* as a naive datetime, ignoring its "+dddd " field."""
+    stripped = OFFSET_PATTERN.sub("", value)
+    return datetime.strptime(stripped, "%a %b %d %H:%M:%S %Y")
+
+
+def extract(line):
+    """Build the output record for one input line.
+
+    Raises ValueError for invalid JSON or an unexpected date format, KeyError
+    for a missing field and TypeError for a value of the wrong type.
+    """
+    tweet = json.loads(line)  # parse once instead of once per field
+    created = parse_created_at(tweet['created_at'])
+    return {
+        'id': tweet['id'],
+        'date': "{:%Y-%m-%d}".format(created),
+        'time': "{:%H:%M:%S}".format(created),
+        'polarity': TextBlob(tweet['text']).sentiment.polarity,
+        'lang': tweet['lang'],
+    }
+
+
+def main():
+    """Convert INPUT_PATH to OUTPUT_PATH, skipping lines that cannot be used."""
+    skipped = 0
+    with io.open(INPUT_PATH, 'r', encoding="utf-8") as source, \
+            io.open(OUTPUT_PATH, 'w', encoding="utf-8") as output_file:
+        for line in source:
+            try:
+                record = extract(line)
+            except (ValueError, KeyError, TypeError):
+                # Best-effort conversion: only the expected per-line failures
+                # are skipped; anything else propagates.
+                skipped += 1
+                continue
+            output_file.write(json.dumps(record) + ',\n')
+    if skipped:
+        sys.stderr.write("skipped {} unusable line(s)\n".format(skipped))
+
+
+if __name__ == "__main__":
+    main()
diff --git a/couchDB/try-couchdb.py b/couchDB/try-couchdb.py
new file mode 100644
--- /dev/null
+++ b/couchDB/try-couchdb.py
@@ -0,0 +1,17 @@
+"""Upload each tweet in tweetsWA.json to the local CouchDB `tweets` db."""
+import couchdb
+import json
+
+couch = couchdb.Server('http://127.0.0.1:5984')
+# NOTE(review): these credentials are committed in plain text; rotate them and
+# load them from the environment or an untracked config file instead.
+couch.resource.credentials = ("admin", "960115")
+
+# Open the database, creating it on first use.
+db = couch['tweets'] if 'tweets' in couch else couch.create('tweets')
+
+with open('tweetsWA.json', encoding='utf-8') as jsonfile:
+    for row in jsonfile:
+        if not row.strip():
+            continue  # a blank line is not a JSON document
+        db.save(json.loads(row))
diff --git a/couchDB/uploadAurin.py b/couchDB/uploadAurin.py
new file mode 100644
--- /dev/null
+++ b/couchDB/uploadAurin.py
@@ -0,0 +1,20 @@
+"""Upload the `features` of vic1.json to the CouchDB `housing-sa4` db."""
+import couchdb
+import json
+
+DB_NAME = 'housing-sa4'
+
+couch = couchdb.Server('http://172.26.133.58:5984')
+# NOTE(review): these credentials are committed in plain text; rotate them and
+# load them from the environment or an untracked config file instead.
+couch.resource.credentials = ("admin", "admin")
+
+# Open the database, creating it on first use.
+db = couch[DB_NAME] if DB_NAME in couch else couch.create(DB_NAME)
+
+# Use a context manager so the file handle is closed once parsed.
+with open('vic1.json') as source:
+    json_data = json.load(source)
+
+for feature in json_data['features']:
+    db.save(feature)