File size: 7,151 Bytes
7e4b742
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
from ..TikTokApi import TikTokApi

from ..TikTokApi.api.user import User
from ..TikTokApi.api.video import Video
import asyncio
import os
import json
from datetime import datetime
import math
# Session token taken from the "ms_token" environment variable (None when unset).
ms_token = os.environ.get("ms_token")  # get your own ms_token from your cookies on tiktok.com
# maxvalue is the ceiling that process_user compares nowProcess against before
# it starts walking a user's videos; nowProcess is the running counter.
maxvalue, nowProcess = 20, 0
def debug(debug: bool = False):
    """Write the ``DEBUG`` environment variable for the current process.

    Args:
        debug: Truthy values store the string ``"True"``; anything falsy
            stores ``"False"``.
    """
    os.environ["DEBUG"] = "True" if debug else "False"
        
def openJson(path):
    """Read the file at *path* and return its decoded JSON content.

    Args:
        path: Location of the JSON file.

    Returns:
        The Python value produced by decoding the file's JSON text.

    Raises:
        Exception: With the message ``"Error opening json file"`` when the
            file cannot be opened, decoded or parsed. The underlying error
            is chained as ``__cause__`` so the real reason stays visible.
    """
    try:
        # JSON text is UTF-8 by specification; do not depend on the platform
        # default encoding (which is a legacy code page on Windows).
        with open(path, "r", encoding="utf-8") as f:
            return json.load(f)
    except Exception as err:
        # ``except Exception`` (not a bare ``except``) lets KeyboardInterrupt
        # and SystemExit propagate untouched.
        raise Exception("Error opening json file") from err
    
def saveJson(path, data):
    """Serialize *data* as JSON and write it to *path*.

    Missing parent directories are created. A *path* without a directory
    component (a bare file name) is written into the current directory.

    Args:
        path: Destination file; overwritten if it already exists.
        data: Any value ``json.dumps`` can serialize.
    """
    # Serialize first so a non-serializable value cannot leave behind a
    # truncated file.
    payload = json.dumps(data)
    directory = os.path.dirname(path)
    # dirname is "" for a bare file name and os.makedirs("") raises, so only
    # create directories when there is one; exist_ok avoids a check/create race.
    if directory:
        os.makedirs(directory, exist_ok=True)
    with open(path, "w") as f:
        f.write(payload)
        
def openTxt(path):
    """Read the text file at *path* and return its lines.

    Args:
        path: Location of the text file.

    Returns:
        A list with one string per line, line terminators removed.

    Raises:
        Exception: With the message ``"Error opening txt file"`` when the
            file cannot be opened or decoded. The underlying error is
            chained as ``__cause__``.
    """
    try:
        with open(path, "r") as f:
            return f.read().splitlines()
    except Exception as err:
        # ``except Exception`` (not a bare ``except``) lets KeyboardInterrupt
        # and SystemExit propagate untouched.
        raise Exception("Error opening txt file") from err
    
def saveTxt(path, data):
    """Write the strings in *data* to *path*, one per line.

    Lines are joined with ``"\\n"``; no trailing newline is added. Missing
    parent directories are created. A *path* without a directory component
    (a bare file name) is written into the current directory.

    Args:
        path: Destination file; overwritten if it already exists.
        data: Iterable of strings.
    """
    # Join first so a non-string item cannot leave behind a truncated file.
    text = "\n".join(data)
    directory = os.path.dirname(path)
    # dirname is "" for a bare file name and os.makedirs("") raises, so only
    # create directories when there is one; exist_ok avoids a check/create race.
    if directory:
        os.makedirs(directory, exist_ok=True)
    with open(path, "w") as f:
        f.write(text)

def saveUserInfoInJson(username, data, hashtag="default"):
    """Store *data* as the JSON record of *username* under *hashtag*.

    The record is handed to ``saveJson`` with the target
    ``Data/JSON/Users/<hashtag>/<username>.json``.

    Args:
        username: Used as the file name (without extension).
        data: Value passed through to ``saveJson``.
        hashtag: Sub-directory name; ``"default"`` when omitted.
    """
    target = f"Data/JSON/Users/{hashtag}/{username}.json"
    saveJson(target, data)


def debugPrint(text):
    """Print *text* prefixed with the current local time and a tab.

    The timestamp is formatted as ``HH:MM:SS.ffffff``.
    """
    stamp = datetime.now().strftime('%H:%M:%S.%f')
    print(f"{stamp}\t{text}")
        
        


async def users_videos_with_hashtag(usernameList, hashtag, blackList: dict[str, list] = None, ms_token: str = None):
    """Run ``process_user`` concurrently for every name in *usernameList*.

    One TikTokApi session is created, a ``process_user`` coroutine is built
    per username, and all of them are awaited together with
    ``asyncio.gather``. Each ``process_user`` call writes that user's
    hashtag totals to a JSON file. The sessions are closed and Playwright
    is stopped once every coroutine has finished.

    Args:
        usernameList: Iterable of TikTok usernames to process.
        hashtag: Hashtag to look for in each user's videos.
        blackList: Optional dict; the ``"usernames"`` and ``"videos"`` keys
            are read as collections of usernames / video ids to skip.
            ``None`` is treated as an empty blacklist.
        ms_token: Optional token forwarded to ``create_sessions`` as the
            only entry of ``ms_tokens``.
    """
    # The parameter defaults to None, but ``.get`` is called on it below and
    # in process_user; normalise once so the default is actually usable.
    if blackList is None:
        blackList = {}

    async with TikTokApi() as api:
        debugPrint("Creating sessions")

        await api.create_sessions(
            ms_tokens=[ms_token],
            num_sessions=1,
            sleep_after=20,
            headless=False,
            # NOTE(review): machine-specific Chrome location; this only works
            # where Chrome is installed at exactly this Windows path.
            executable_path="C:/Program Files/Google/Chrome/Application/chrome.exe",
            override_browser_args=["--disable-blink-features=AutomationControlled"],
        )

        # Coroutine objects only; nothing runs until gather() awaits them.
        tasks = [
            process_user(username=userName, api=api, hashtag=hashtag, blackList=blackList)
            for userName in usernameList
        ]

        debugPrint("Sessions created")
        print(blackList.get("usernames", ""))
        await asyncio.gather(*tasks)

        await api.close_sessions()
        await api.stop_playwright()

async def process_user(username, api, hashtag, blackList):
    """Total the views of one user's videos tagged with *hashtag* and save them.

    The user is skipped when listed under ``blackList["usernames"]``.
    Otherwise the user's info is fetched, the coroutine waits until fewer
    than ``maxvalue`` users are being processed, then it iterates over the
    user's videos, summing ``playCount`` for every video (not listed under
    ``blackList["videos"]``) that carries the hashtag. The totals are
    written with ``saveUserInfoInJson``.

    Errors are reported on stdout and never raised to the caller, so one
    failing user does not abort the whole ``asyncio.gather`` batch.

    Args:
        username: TikTok username to process.
        api: Object exposing ``user(username=...)``.
        hashtag: Hashtag to match, compared case-insensitively.
        blackList: Dict with optional ``"usernames"`` and ``"videos"``
            collections; ``None`` is treated as empty.
    """
    # Without this declaration the augmented assignments below make
    # ``nowProcess`` a local name and the first read raises UnboundLocalError.
    global nowProcess

    blackList = blackList or {}
    if username in blackList.get("usernames", []):
        debugPrint(f"Skipping user {username} because it is in the blacklist")
        return
    debugPrint(f"Getting user {username}")
    debugPrint(f"username = {username}")

    try:
        user: User = api.user(username=username)
        user_data = await user.info()
    except Exception:
        print(f"Error getting user {username}")
        return

    # Crude concurrency limit. There is no ``await`` between leaving the loop
    # and the increment, so on a single event loop the check-and-take is atomic.
    while nowProcess >= maxvalue:
        debugPrint(f"Waiting for {username}")
        await asyncio.sleep(1)
    nowProcess += 1
    try:
        videosLen = user_data["userInfo"]["stats"]["videoCount"]
        debugPrint(f"videosLen = {videosLen}")

        # Hoisted out of the loop: both values are invariant per user.
        skipped_videos = blackList.get("videos", [])
        wanted_tag = str(hashtag).lower()  # tag names are lowercased below too

        total_views = 0
        total_videos_with_tag = 0
        async for video in user.videos(count=videosLen):
            if video.id in skipped_videos:
                continue
            if any(str(h.name).lower() == wanted_tag for h in video.hashtags):
                total_views += int(video.stats.get("playCount", 0))
                total_videos_with_tag += 1

        debugPrint(f"save {username} {total_views}")
        saveUserInfoInJson(
            username=username,
            data={
                "username": username,
                "total_views": total_views,
                "total_videos_with_tag": total_videos_with_tag,
            },
            hashtag=hashtag,
        )
    except Exception as err:
        # ``except Exception`` keeps task cancellation (a BaseException)
        # propagating instead of being swallowed.
        print(f"Error getting user {username} !")
        debugPrint(f"{type(err).__name__}: {err}")
    finally:
        # Release the slot on success, failure and cancellation alike, and
        # only when it was actually taken.
        nowProcess -= 1

if __name__ == "__main__":
    # Script entry point: tally the views of every listed user's videos that
    # carry the hashtag below, skipping anything named in the blacklist file.
    os.environ["DEBUG"] = "True"
    usernameList = openTxt("Data/TXT/cacto0o.txt")
    hashtag = "костиккакто"
    blackList = openJson("Data/JSON/blackList.json")
    asyncio.run(
        users_videos_with_hashtag(
            usernameList=usernameList,
            hashtag=hashtag,
            blackList=blackList,
            # Forward the token read from the "ms_token" environment variable
            # at module level; it was previously read but never used.
            ms_token=ms_token,
        )
    )