Spaces:

weanalyze
/

twitter_scraper

Runtime error

jiandong committed on Mar 13, 2023

Commit

887546c

1 Parent(s): 4a3a06a

Upload with huggingface_hub

Files changed (4) hide show

Dockerfile ADDED Viewed

+# read the doc: https://huggingface.co/docs/hub/spaces-sdks-docker
+# you will also find guides on how best to write your Dockerfile
+FROM python:3.8
+# Set up a new user named "user" with user ID 1000
+RUN useradd -m -u 1000 user
+# Switch to the "user" user
+USER user
+# Set home to the user's home directory and put user-level pip scripts on PATH
+ENV HOME=/home/user \
+	PATH=/home/user/.local/bin:$PATH
+# Set the working directory to the app directory inside the user's home
+WORKDIR $HOME/app
+# Copy only the dependency manifest first so the pip layer below is rebuilt
+# only when requirements.txt changes, not on every source edit
+COPY --chown=user requirements.txt $HOME/app/requirements.txt
+RUN pip install --no-cache-dir --upgrade -r $HOME/app/requirements.txt
+# Copy the rest of the current directory into the container at $HOME/app, setting the owner to the user
+COPY --chown=user . $HOME/app
+# Serve the workcell described by workcell.yaml on all interfaces, port 7860
+CMD ["workcell", "serve", "--config", "workcell.yaml", "--host", "0.0.0.0", "--port", "7860"]

app.py ADDED Viewed

+from tweety.bot import Twitter
+from pydantic import BaseModel, Field
+import pandas as pd
+from workcell.integrations.types import PerspectiveTable
+class Input(BaseModel):
+    username: str = Field(default="sama", description="Twitter username of the person you want to scrape")
+def fetch_twitter_by_id(username):
+    # app = Twitter("elonmusk")
+    app = Twitter(username)
+    # Get 20 Tweets of a user
+    all_tweets = app.get_tweets()
+    return all_tweets
+def process_tweets(tweets):
+    all_tweets = [tweet.to_dict() for tweet in tweets]
+    # pandas dataframe
+    df = pd.DataFrame(all_tweets)
+    # filter
+    filter_columns = ['created_on', 'text', 'likes','reply_counts', 'retweet_counts', 'id']
+    df = df[filter_columns]
+    return df
+def twitter_scraper(input: Input) -> PerspectiveTable:
+    """Returns latest 20 tweets of given usename, such as 'elonmusk'. """
+    all_tweets = fetch_twitter_by_id(username=input.username)
+    df = process_tweets(all_tweets)
+    return PerspectiveTable(data=df)

requirements.txt ADDED Viewed

workcell.yaml ADDED Viewed

+# Workcell configuration; the Dockerfile CMD passes this file to
+# `workcell serve --config workcell.yaml`.
+workcell_name: twitter_scraper
+workcell_provider: huggingface
+workcell_id: weanalyze/twitter_scraper
+workcell_version: latest
+# Same Python version as the python:3.8 base image in the Dockerfile
+workcell_runtime: python3.8
+# Presumably "<module>:<function>": app.py defines twitter_scraper -- confirm against workcell docs
+workcell_entrypoint: app:twitter_scraper
+workcell_code:
+  ImageUri: ''
+workcell_tags: {}
+workcell_envs: {}