diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..a12bd41 --- /dev/null +++ b/LICENSE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) 2022 COMP90024-2022 Group 52 + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
diff --git a/README.md b/README.md index 8e69bae..be12dc2 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,51 @@ # COMP90024-Cluster-and-Cloud-Computing-Assignment-2 - Cluster & Cloud Computing, Twitter analyzer + +## Introduction +The focus of this project is to harvest tweets from Melbourne on the MRC and undertake a variety of social media data analytics +scenarios that explore the liveability of Melbourne and, importantly, how the Twitter data can be used +alongside/compared with/augment the data available within the AURIN platform to improve our +knowledge of the liveability of Melbourne. + +This project is a Cloud-based solution that exploits a multitude of virtual machines (VMs) +across the MRC for harvesting tweets through the Twitter APIs (using both the Streaming and the +Search API interfaces). + +We have produced a solution that can be run (in principle) across any node of the MRC to +harvest and store tweets and scale up/down as required. The solution includes multiple +Twitter harvesting applications for Melbourne. These harvesting applications run on +the MRC together with an associated CouchDB database containing the amalgamated collection +of tweets. The CouchDB setup is based on a cluster setup. + +## Tech stack +- Python + Flask +- Tweepy +- CouchDB +- React.js +- Docker +- Nginx +- NLTK + TextBlob + +## License +``` +MIT License + +Copyright (c) 2022 COMP90024-2022 Group 52 + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. 
+ +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. +``` diff --git a/aurin_helper/config/config.py b/aurin_helper/config/config.py index 8824339..c52943a 100644 --- a/aurin_helper/config/config.py +++ b/aurin_helper/config/config.py @@ -175,7 +175,7 @@ 'sep_21': 'un_rate_2021_9' } -EMPLOYMENT_PATH = '/data/Aurin/Employ/unemployment.csv' +EMPLOYMENT_PATH = '/data/Aurin/Employ/employment.csv' EMPLOYMENT_INFO = { 'mar_19': 'num_2019_3', 'jun_19': 'num_2019_6', diff --git a/backend/upload_design_doc.py b/backend/upload_design_doc.py index 382e17b..a0d621d 100644 --- a/backend/upload_design_doc.py +++ b/backend/upload_design_doc.py @@ -255,7 +255,7 @@ if response.status_code != 201: print('Error uploading') - for each in cfg.get_twitter_dbs: + for each in cfg.get_twitter_dbs(): response = requests.put( req_link.format(db=each, design_doc='languages'), headers={"Content-Type": "application/json"}, @@ -264,4 +264,4 @@ if response.status_code != 201: print('Error uploading') - \ No newline at end of file +