DRAE-MLP
diff --git a/‎label_tweet.ipynb
+20-18 b/‎label_tweet.ipynb
+20-18
@@ -16,7 +16,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -31,14 +31,11 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": [
-    "df = pd.read_csv(\"G:/Shared drives/Unidad Compartida Pachitos/Data Science Projects Pachitos/HackOff-CompanySentiments/archive (2)/Tweets.csv\")\n",
-    "df.drop(['tweet_id','airline_sentiment_confidence','negativereason','negativereason_confidence','airline_sentiment_gold','name','negativereason_gold','retweet_count',\n",
-    "'tweet_coord','tweet_created','tweet_location','user_timezone','airline'], axis = 1, inplace = True)\n",
-    "df = df.rename(columns = {'airline_sentiment':'original'})"
+    "#df = pd.read_csv(\"G:/Shared drives/Unidad Compartida Pachitos/Data Science Projects Pachitos/HackOff-CompanySentiments/tesla_sf.csv\")"
    ]
   },
   {
@@ -47,14 +44,13 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "#data_location = 's3://tweets-hackoff2/Tweets.csv'\n",
-    "#df = pd.read_csv(data_location)\n",
-    "#df"
+    "data_location = 's3://tweets-hackoff2/tesla_sf.csv'  # S3 URI of the input CSV\n",
+    "df = pd.read_csv(filepath_or_buffer=data_location)  # NOTE(review): pandas needs s3fs for s3:// paths - confirm it is installed"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -89,7 +85,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 7,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -98,18 +94,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
      "output_type": "execute_result",
      "data": {
       "text/plain": [
-       "<__main__.SentimentAnalysisTweets at 0x1e7c26cd2c8>"
+       "<__main__.SentimentAnalysisTweets at 0x20e6cf84188>"
       ]
      },
      "metadata": {},
-     "execution_count": 7
+     "execution_count": 8
     }
    ],
    "source": [
@@ -118,12 +114,12 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 14,
    "metadata": {},
    "outputs": [],
    "source": [
-    "df_label = pd.DataFrame()\n",
-    "df_label['text'] = tweet_class.tweets_.loc[(tweet_class.tweets_['flag'] == 'negative'),'text']\n",
+    "# Export every column except 'tweets_clean' and 'sentiment'.\n",
+    "df_label = tweet_class.tweets_.drop(columns=['tweets_clean','sentiment'])\n",
     "df_label.to_csv('label_tweets.csv', index=False)"
    ]
   },
@@ -132,7 +128,13 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": []
+   "source": [
+    "# Upload the labelled CSV to S3, using the file name as the object key.\n",
+    "# NOTE(review): input is read from 'tweets-hackoff2' but this uploads to 'tweets-hackoff' - confirm the bucket.\n",
+    "import boto3\n",
+    "s3 = boto3.resource('s3')\n",
+    "s3.meta.client.upload_file('label_tweets.csv', 'tweets-hackoff', 'label_tweets.csv')"
+   ]
   }
  ],
  "metadata": {