Skip to content

Workflow module

Source code in search_client/client.py
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
class SearchClient:

    BASE_URL: URL = URL(config.BASE_URL)

    def __init__(self, bearer_token: str) -> None:
        """Store the bearer token and build the authorization header.

        Args:
            bearer_token (str):
                Token placed in the ``Authorization: Bearer ...`` header that
                the request methods of this client pass to ``requests.get``.
        """
        self.bearer_token = bearer_token
        # Built once here and reused for every request.
        self.headers = dict(Authorization=f"Bearer {self.bearer_token}")

    def get_users(
        self,
        usernames: list[str],
        expansions: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
    ) -> dict:
        """Look up several users at once by their usernames.

        Args:
            usernames (list[str]):
                Usernames to query. A bare string is also accepted and is
                treated as a single username.

            expansions (list[str] | None, optional):
                Values for the ``expansions`` query parameter.
                Check field_enums.Expansions for possible options. Defaults to None.

            tweet_fields (list[str] | None, optional):
                Values for the ``tweet.fields`` query parameter.
                Check field_enums.TweetFields for possible options. Defaults to None.

            user_fields (list[str] | None, optional):
                Values for the ``user.fields`` query parameter.
                Check field_enums.UserFields for possible options. Defaults to None.

        Returns:
            dict: Raw dictionary decoded from the JSON response.
            "data" key will have the user info in form of list of dicts
            (this behaviour may change in the future)
        """
        endpoint = SearchClient.BASE_URL / "users" / "by"
        username_list = [usernames] if isinstance(usernames, str) else usernames

        # Each list is sent as one comma-separated value; empty or missing
        # lists are left out of the query string altogether.
        params = {}
        for name, values in (
            ("usernames", username_list),
            ("tweet.fields", tweet_fields),
            ("user.fields", user_fields),
            ("expansions", expansions),
        ):
            if values:
                params[name] = ",".join(values)

        return requests.get(endpoint, headers=self.headers, params=params).json()

    def get_user(
        self,
        username: str,
        expansions: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
    ) -> dict:
        """Look up a single user by username.

        Args:
            username (str):
                Username appended to the request path.

            expansions (list[str] | None, optional):
                Values for the ``expansions`` query parameter.
                Check field_enums.Expansions for possible options. Defaults to None.

            tweet_fields (list[str] | None, optional):
                Tweet fields as defined by the Twitter API; only possible if user has a pinned tweet.
                Check field_enums.TweetFields for possible options. Defaults to None.

            user_fields (list[str] | None, optional):
                User fields as defined by the Twitter API.
                Check field_enums.UserFields for possible options. Defaults to None.

        Returns:
            dict: Raw dictionary decoded from the JSON response.
                "data" key will have the user info in form of dict
                (this behaviour may change in the future)
        """
        endpoint = SearchClient.BASE_URL / "users" / "by" / "username" / username
        optional_lists = (
            ("tweet.fields", tweet_fields),
            ("user.fields", user_fields),
            ("expansions", expansions),
        )
        # Only non-empty lists are sent, each joined into one comma-separated value.
        params = {name: ",".join(values) for name, values in optional_lists if values}
        return requests.get(endpoint, headers=self.headers, params=params).json()

    def get_tweet_info(
        self,
        tweet_id: str | list[str],
        *,
        expansions: list[str] | None = None,
        media_fields: list[str] | None = None,
        place_fields: list[str] | None = None,
        poll_fields: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
    ) -> dict:
        """Fetch one or more tweets by id.

        Args:
            tweet_id (str | list[str]):
                A single tweet id or a list of ids; sent as the
                comma-separated ``ids`` query parameter.

            expansions, media_fields, place_fields, poll_fields,
            tweet_fields, user_fields (list[str] | None, optional):
                Values for the ``expansions`` and ``*.fields`` query
                parameters. Empty or ``None`` lists are not sent.

        Returns:
            dict: Raw dictionary decoded from the JSON response.
        """
        endpoint = SearchClient.BASE_URL / "tweets"
        id_list = [tweet_id] if isinstance(tweet_id, str) else tweet_id

        params = {}
        for name, values in (
            ("ids", id_list),
            ("media.fields", media_fields),
            ("place.fields", place_fields),
            ("poll.fields", poll_fields),
            ("tweet.fields", tweet_fields),
            ("user.fields", user_fields),
            ("expansions", expansions),
        ):
            if values:
                params[name] = ",".join(values)

        return requests.get(endpoint, headers=self.headers, params=params).json()

    def _get_tweet(
        self,
        query: list[str],
        *,
        max_results: int = 10,
        end_time: dt.datetime | None = None,
        start_time: dt.datetime | None = None,
        next_token: str | None = None,
        since_id: str | None = None,
        sort_order: str | None = None,
        until_id: str | None = None,
        expansions: list[str] | None = None,
        media_fields: list[str] | None = None,
        place_fields: list[str] | None = None,
        poll_fields: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
        archive: bool = False,
    ) -> dict:
        """
        Run a single tweet-search request and return the decoded JSON body.

        This method is meant to be lower-level: it only builds the query
        parameters and makes one HTTP request (no pagination).
        Use `get_tweets` for a simpler way.

        Example:
        >>> sc = SearchClient("your_bearer_token")  # make SearchClient obj
        >>> sc._get_tweet(["tesla", "from:elonmusk"])
        <One page of up to 10 recent tweets with keyword "tesla" from elonmusk>

        >>> sc._get_tweet(["bitcoin", "from:elonmusk"], max_results=20)
        <One page of up to 20 recent tweets with keyword "bitcoin" from elonmusk>

        Args:
            query (list[str]):
                Query terms; joined with single spaces into the ``query`` parameter.

            end_time, start_time (dt.datetime | None, optional):
                Time bounds. ``datetime`` objects are sent in ISO 8601 form
                via ``isoformat()``; any other value (for example an
                already formatted string) is passed through unchanged.
                NOTE(review): a naive datetime is serialized without a UTC
                offset -- confirm the API accepts that, or pass aware values.

            archive (bool, optional):
                When true the request goes to ``tweets/search/all``,
                otherwise to ``tweets/search/recent``. Defaults to False.

            Remaining keyword arguments are forwarded as the query
            parameters of the same name (``*_fields`` become ``*.fields``).

        Returns:
            dict: Raw dictionary decoded from the JSON response.

        Each parameter is described in the official documentation for Twitter API
        https://developer.twitter.com/en/docs/twitter-api/tweets/search/api-reference/get-tweets-search-recent

        Building low-level queries can be complicated at first.
        Make sure to read through the link below for understanding.
        https://developer.twitter.com/en/docs/twitter-api/tweets/search/integrate/build-a-query
        """
        fields = {
            "media.fields": media_fields,
            "place.fields": place_fields,
            "poll.fields": poll_fields,
            "tweet.fields": tweet_fields,
            "user.fields": user_fields,
            "expansions": expansions,
        }
        # Lists go out as one comma-separated value; empty/None lists are omitted.
        field_params = {k: ",".join(v) for k, v in fields.items() if v}

        # A raw datetime would be stringified by requests with a space
        # separator ("2023-01-01 00:00:00"), which is not ISO 8601.
        if isinstance(end_time, dt.datetime):
            end_time = end_time.isoformat()
        if isinstance(start_time, dt.datetime):
            start_time = start_time.isoformat()

        # Entries whose value is None are dropped by requests when it
        # builds the query string, so unset options need no filtering here.
        params = {
            **field_params,
            "query": " ".join(query),
            "max_results": max_results,
            "end_time": end_time,
            "next_token": next_token,
            "since_id": since_id,
            "sort_order": sort_order,
            "start_time": start_time,
            "until_id": until_id,
        }
        url = SearchClient.BASE_URL / "tweets" / "search" / ("all" if archive else "recent")
        response = requests.get(url, params=params, headers=self.headers)
        return response.json()

    def get_tweets(
        self,
        query: list[str],
        number_of_tweets: int | None,
        *,
        start_time=None,
        end_time=None,
        archive=False,
    ) -> list[dict]:
        """Higher level method for fetching tweets using only query, number of tweets

        Pages through the search results with `_get_tweet` until enough
        tweets have been collected or no further page is available.

        Args:
            query (list[str]):
                Query to Twitter API.

            number_of_tweets (int | None):
                Number of tweets wanted by the user. 10 is the minimum.
                If `None`, return all tweets.

            start_time (optional):
                The oldest UTC timestamp from which the Tweets will be provided.
                By default, a request will return Tweets from up to 30 days ago if
                it is `None`. Timestamp is in second granularity and is inclusive
                (for example, 12:00:01 includes the first second of the minute).
                Defaults to None.

            end_time (optional):
                The newest, most recent UTC timestamp to which the Tweets will be
                provided. Timestamp is in second granularity and is exclusive
                (for example, 12:00:01 excludes the first second of the minute).
                If used without start_time, Tweets from 30 days before end_time
                will be returned by default. If not specified, end_time will
                default to [now - 30 seconds]. Defaults to None.

            archive (bool, optional):
                Forwarded to `_get_tweet`; selects the full-archive search
                endpoint instead of the recent one. Defaults to False.

        Returns:
            list[dict]:
                Resulting list of tweets (dict), at most `number_of_tweets`
                long when a number was given. Each tweet dict will have:
                author_id, conversation_id, created_at, id, public_metrics, and text.
                Expansions and context annotations are not included.

        Raises:
            ValueError: If `number_of_tweets` is given and is below 10.

        >>> from search_client.client import SearchClient
        >>> client = SearchClient("<your_token>")
        >>> client.get_tweets(query=["from:TwitterDev", "-is:retweet"], number_of_tweets=10)
        [{...}, {...}]
        """
        if number_of_tweets is not None and number_of_tweets < 10:
            raise ValueError("Number of tweets must be more than or equal to 10")

        params = {
            # Page size: 100 unless fewer tweets than that were requested.
            "max_results": 100 if number_of_tweets is None else min(100, number_of_tweets),
            "end_time": end_time,
            "start_time": start_time,
            "next_token": None,
            "tweet_fields": [
                TweetFields.AUTHOR_ID,
                TweetFields.CONVERSATION_ID,
                TweetFields.PUBLIC_METRICS,
                TweetFields.IN_REPLY_TO_USER_ID,
                TweetFields.CREATED_AT,
            ],
        }

        tweets = []
        remaining = number_of_tweets  # None means "no limit"
        while True:
            response = self._get_tweet(query, **params, archive=archive)
            # Error responses may carry no "meta"; treat that as an empty last page.
            meta = response.get("meta") or {}

            result_count = meta.get("result_count", 0)
            if result_count > 0:
                tweets.extend(response.get("data", []))
                if remaining is not None:
                    remaining -= result_count

            next_token = meta.get("next_token")
            if not next_token or (remaining is not None and remaining <= 0):
                break

            # Pause between pages to stay under the API rate limit.
            time.sleep(3.1)
            if remaining is not None:
                # A page cannot be smaller than 10, so the final page may
                # overshoot; the surplus is trimmed below.
                params["max_results"] = min(100, max(10, remaining))
            params["next_token"] = next_token

        return tweets if number_of_tweets is None else tweets[:number_of_tweets]

    def get_all_tweets(
        self,
        query: list[str],
        *,
        cooldown: float = 3,
        max_results: int = 10,
        end_time: dt.datetime | None = None,
        start_time: dt.datetime | None = None,
        next_token: str | None = None,
        since_id: str | None = None,
        sort_order: str | None = None,
        until_id: str | None = None,
        expansions: list[str] | None = None,
        media_fields: list[str] | None = None,
        place_fields: list[str] | None = None,
        poll_fields: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
        tweet_only: bool = False,
        max_page: int | None = 1,
    ) -> dict | list:
        """Collect pages of search results from the full-archive endpoint.

        Calls `_get_tweet` with ``archive=True`` repeatedly, following
        ``next_token``, and stops at the first page without "data", when
        there is no further token, or after ``max_page`` pages.

        Args:
            query (list[str]):
                Query terms forwarded to `_get_tweet`.

            cooldown (float, optional):
                Seconds to sleep between two page requests. Defaults to 3.

            tweet_only (bool, optional):
                If true, the returned list holds the tweet dicts of every
                page; otherwise it holds the raw page responses.
                Defaults to False.

            max_page (int | None, optional):
                Maximum number of pages to fetch; ``None`` removes the
                limit. Defaults to 1.

            All other keyword arguments are forwarded to `_get_tweet`
            unchanged; ``next_token`` is the token for the first page.

        Returns:
            list: Tweet dicts or raw page responses, depending on ``tweet_only``.
        """
        search_kwargs = dict(
            max_results=max_results,
            end_time=end_time,
            start_time=start_time,
            next_token=next_token,
            since_id=since_id,
            sort_order=sort_order,
            until_id=until_id,
            expansions=expansions,
            media_fields=media_fields,
            place_fields=place_fields,
            poll_fields=poll_fields,
            tweet_fields=tweet_fields,
            user_fields=user_fields,
        )
        collected = []
        pages_left = max_page

        while pages_left is None or pages_left > 0:
            page = self._get_tweet(query, **search_kwargs, archive=True)
            if not page.get("data"):
                break

            if tweet_only:
                collected.extend(page["data"])
            else:
                collected.append(page)

            if pages_left is not None:
                pages_left -= 1

            search_kwargs["next_token"] = page.get("meta").get("next_token")

            # Decide before sleeping, so no cooldown is spent after the
            # final page.
            page_budget_spent = pages_left is not None and pages_left <= 0
            if page_budget_spent or not search_kwargs["next_token"]:
                break

            time.sleep(cooldown)

        return collected

    def get_recent_tweets(
        self,
        query: list[str],
        *,
        cooldown: float = 3,
        max_results: int = 10,
        end_time: dt.datetime | None = None,
        start_time: dt.datetime | None = None,
        next_token: str | None = None,
        since_id: str | None = None,
        sort_order: str | None = None,
        until_id: str | None = None,
        expansions: list[str] | None = None,
        media_fields: list[str] | None = None,
        place_fields: list[str] | None = None,
        poll_fields: list[str] | None = None,
        tweet_fields: list[str] | None = None,
        user_fields: list[str] | None = None,
        tweet_only: bool = False,
        max_page: int | None = 1,
    ) -> dict | list:
        """Collect pages of search results from the recent-search endpoint.

        Calls `_get_tweet` with ``archive=False`` repeatedly, following
        ``next_token``, until there is no further token or ``max_page``
        pages have been fetched.

        Args:
            query (list[str]):
                Query terms forwarded to `_get_tweet`.

            cooldown (float, optional):
                Seconds to sleep between two page requests. Defaults to 3.

            tweet_only (bool, optional):
                If true, the returned list holds the tweet dicts of every
                page; otherwise it holds the raw page responses (including
                a page that carries no "data"). Defaults to False.

            max_page (int | None, optional):
                Maximum number of pages to fetch; ``None`` removes the
                limit. Defaults to 1.

            All other keyword arguments are forwarded to `_get_tweet`
            unchanged; ``next_token`` is the token for the first page.

        Returns:
            list: Tweet dicts or raw page responses, depending on ``tweet_only``.
        """
        result = []
        params = {
            "max_results": max_results,
            "end_time": end_time,
            "start_time": start_time,
            "next_token": next_token,
            "since_id": since_id,
            "sort_order": sort_order,
            "until_id": until_id,
            "expansions": expansions,
            "media_fields": media_fields,
            "place_fields": place_fields,
            "poll_fields": poll_fields,
            "tweet_fields": tweet_fields,
            "user_fields": user_fields,
        }

        while max_page is None or max_page > 0:
            page = self._get_tweet(query, **params, archive=False)

            if tweet_only:
                # A page without matches (or an error body) has no "data"
                # key; contribute nothing instead of raising KeyError.
                result.extend(page.get("data") or [])
            else:
                result.append(page)

            if max_page is not None:
                max_page -= 1

            # "meta" can be absent as well; then there is no next page.
            params["next_token"] = (page.get("meta") or {}).get("next_token")

            # check for max_page to eliminate waiting
            # when remaining page is 0 (max_page <= 0)
            if not params["next_token"] or (max_page is not None and max_page <= 0):
                break

            time.sleep(cooldown)

        return result

    def get_tweet_count_user(self, username: str, *, cooldown: float = 3) -> int:
        """Return total number of tweets from a user using username (twitter handle)

        Looks up the account creation time with `get_user`, then sums the
        ``total_tweet_count`` of every page returned by the
        ``tweets/counts/all`` endpoint for the query ``from:<username>``.

        Args:
            username (str): Twitter handle of the user ie username
            cooldown (float, optional): Seconds to sleep between two page
                requests. Defaults to 3.

        Returns:
            int: number of tweets they have tweeted since the creation of their account
        """
        account = self.get_user(username, user_fields=[UserFields.CREATED_AT])

        # End one minute in the past: per the original note the API wants
        # end_time to lie at least 10 seconds before the request is made.
        one_minute_ago = dt.datetime.now(dt.timezone.utc) - dt.timedelta(minutes=1)
        params = {
            "query": f"from:{username}",
            "start_time": account["data"]["created_at"],
            "end_time": one_minute_ago.isoformat(),
            "granularity": "day",
        }
        counts_url = SearchClient.BASE_URL / "tweets" / "counts" / "all"

        total = 0
        more_pages = True
        while more_pages:
            page = requests.get(counts_url, headers=self.headers, params=params)
            meta = page.json().get("meta")
            total += meta.get("total_tweet_count")

            token = meta.get("next_token")
            more_pages = bool(token)
            if more_pages:
                params["next_token"] = token
                time.sleep(cooldown)
        return total

    def get_tweet_count(
        self,
        query: list[str],
        *,
        end_time: dt.datetime | None = None,
        start_time: dt.datetime | None = None,
        next_token: str | None = None,
        since_id: str | None = None,
        until_id: str | None = None,
        cooldown: float = 3,
    ) -> int:
        """Return the total number of tweets matching a query.

        Sums the ``total_tweet_count`` of every page returned by the
        ``tweets/counts/all`` endpoint (requested with day granularity).

        Args:
            query (list[str]):
                Query terms; joined with single spaces into the ``query`` parameter.

            end_time, start_time (dt.datetime | None, optional):
                Time bounds. ``datetime`` objects are sent in ISO 8601 form
                via ``isoformat()``; any other value (for example an
                already formatted string) is passed through unchanged.

            next_token (str | None, optional):
                Pagination token for the first request. Defaults to None.

            since_id, until_id (str | None, optional):
                Forwarded as the query parameters of the same name.

            cooldown (float, optional):
                Seconds to sleep between two page requests. Defaults to 3.

        Returns:
            int: Sum of ``total_tweet_count`` over all fetched pages.
        """
        # A raw datetime would be stringified by requests with a space
        # separator, which is not ISO 8601.
        if isinstance(end_time, dt.datetime):
            end_time = end_time.isoformat()
        if isinstance(start_time, dt.datetime):
            start_time = start_time.isoformat()

        params = {
            "query": " ".join(query),
            "end_time": end_time,
            "granularity": "day",
            "next_token": next_token,
            "since_id": since_id,
            "start_time": start_time,
            "until_id": until_id,
        }

        url = SearchClient.BASE_URL / "tweets" / "counts" / "all"

        total = 0
        while True:
            response = requests.get(url, headers=self.headers, params=params)
            meta = response.json().get("meta")
            total += meta.get("total_tweet_count")
            next_token = meta.get("next_token")
            if not next_token:
                break
            params["next_token"] = next_token
            time.sleep(cooldown)
        return total

get_tweet_count_user(username, *, cooldown=3)

Return total number of tweets from a user using username (twitter handle)

Parameters:

Name Type Description Default
username str

Twitter handle of the user ie username

required

Returns:

Name Type Description
int int

number of tweets they have tweeted since the creation of their account

Source code in search_client/client.py
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
def get_tweet_count_user(self, username: str, *, cooldown: float = 3) -> int:
    """Return total number of tweets from a user using username (twitter handle)

    Looks up the account creation time with `get_user`, then sums the
    ``total_tweet_count`` of every page returned by the
    ``tweets/counts/all`` endpoint for the query ``from:<username>``.

    Args:
        username (str): Twitter handle of the user ie username
        cooldown (float, optional): Seconds to sleep between two page
            requests. Defaults to 3.

    Returns:
        int: number of tweets they have tweeted since the creation of their account
    """
    account = self.get_user(username, user_fields=[UserFields.CREATED_AT])

    # End one minute in the past: per the original note the API wants
    # end_time to lie at least 10 seconds before the request is made.
    one_minute_ago = dt.datetime.now(dt.timezone.utc) - dt.timedelta(minutes=1)
    params = {
        "query": f"from:{username}",
        "start_time": account["data"]["created_at"],
        "end_time": one_minute_ago.isoformat(),
        "granularity": "day",
    }
    counts_url = SearchClient.BASE_URL / "tweets" / "counts" / "all"

    total = 0
    more_pages = True
    while more_pages:
        page = requests.get(counts_url, headers=self.headers, params=params)
        meta = page.json().get("meta")
        total += meta.get("total_tweet_count")

        token = meta.get("next_token")
        more_pages = bool(token)
        if more_pages:
            params["next_token"] = token
            time.sleep(cooldown)
    return total

get_tweets(query, number_of_tweets, *, start_time=None, end_time=None, archive=False)

Higher level method for fetching tweets using only query, number of tweets

Parameters:

Name Type Description Default
query list[str]

Query to Twitter API.

required
number_of_tweets int

Number of tweets wanted by the user. 10 is the minimum. If None, return all tweets.

required
start_time _type_

The oldest UTC timestamp from which the Tweets will be provided. By default, a request will return Tweets from up to 30 days ago if it is None. Timestamp is in second granularity and is inclusive (for example, 12:00:01 includes the first second of the minute). Defaults to None.

None
end_time _type_

The newest, most recent UTC timestamp to which the Tweets will be provided. Timestamp is in second granularity and is exclusive (for example, 12:00:01 excludes the first second of the minute). If used without start_time, Tweets from 30 days before end_time will be returned by default. If not specified, end_time will default to [now - 30 seconds]. Defaults to None.

None

Returns:

Type Description
list[dict]

list[dict]: Resulting list of tweets (dict). Each tweet dict will have: author_id, conversation_id, created_at, id, public_metrics, and text. Expansions and context annotations are not included.

>>> from search_client.client import SearchClient
>>> client = SearchClient("<your_token>")
>>> client.get_tweets(query=["from:TwitterDev", "-is:retweet"], number_of_tweets=10)
[{...}, {...}]

Source code in search_client/client.py
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
def get_tweets(
    self,
    query: list[str],
    number_of_tweets: int | None,
    *,
    start_time=None,
    end_time=None,
    archive=False,
) -> list[dict]:
    """Higher level method for fetching tweets using only query, number of tweets

    Pages through the search results with `_get_tweet` until enough
    tweets have been collected or no further page is available.

    Args:
        query (list[str]):
            Query to Twitter API.

        number_of_tweets (int | None):
            Number of tweets wanted by the user. 10 is the minimum.
            If `None`, return all tweets.

        start_time (optional):
            The oldest UTC timestamp from which the Tweets will be provided.
            By default, a request will return Tweets from up to 30 days ago if
            it is `None`. Timestamp is in second granularity and is inclusive
            (for example, 12:00:01 includes the first second of the minute).
            Defaults to None.

        end_time (optional):
            The newest, most recent UTC timestamp to which the Tweets will be
            provided. Timestamp is in second granularity and is exclusive
            (for example, 12:00:01 excludes the first second of the minute).
            If used without start_time, Tweets from 30 days before end_time
            will be returned by default. If not specified, end_time will
            default to [now - 30 seconds]. Defaults to None.

        archive (bool, optional):
            Forwarded to `_get_tweet`; selects the full-archive search
            endpoint instead of the recent one. Defaults to False.

    Returns:
        list[dict]:
            Resulting list of tweets (dict), at most `number_of_tweets`
            long when a number was given. Each tweet dict will have:
            author_id, conversation_id, created_at, id, public_metrics, and text.
            Expansions and context annotations are not included.

    Raises:
        ValueError: If `number_of_tweets` is given and is below 10.

    >>> from search_client.client import SearchClient
    >>> client = SearchClient("<your_token>")
    >>> client.get_tweets(query=["from:TwitterDev", "-is:retweet"], number_of_tweets=10)
    [{...}, {...}]
    """
    if number_of_tweets is not None and number_of_tweets < 10:
        raise ValueError("Number of tweets must be more than or equal to 10")

    params = {
        # Page size: 100 unless fewer tweets than that were requested.
        "max_results": 100 if number_of_tweets is None else min(100, number_of_tweets),
        "end_time": end_time,
        "start_time": start_time,
        "next_token": None,
        "tweet_fields": [
            TweetFields.AUTHOR_ID,
            TweetFields.CONVERSATION_ID,
            TweetFields.PUBLIC_METRICS,
            TweetFields.IN_REPLY_TO_USER_ID,
            TweetFields.CREATED_AT,
        ],
    }

    tweets = []
    remaining = number_of_tweets  # None means "no limit"
    while True:
        response = self._get_tweet(query, **params, archive=archive)
        # Error responses may carry no "meta"; treat that as an empty last page.
        meta = response.get("meta") or {}

        result_count = meta.get("result_count", 0)
        if result_count > 0:
            tweets.extend(response.get("data", []))
            if remaining is not None:
                remaining -= result_count

        next_token = meta.get("next_token")
        if not next_token or (remaining is not None and remaining <= 0):
            break

        # Pause between pages to stay under the API rate limit.
        time.sleep(3.1)
        if remaining is not None:
            # A page cannot be smaller than 10, so the final page may
            # overshoot; the surplus is trimmed below.
            params["max_results"] = min(100, max(10, remaining))
        params["next_token"] = next_token

    return tweets if number_of_tweets is None else tweets[:number_of_tweets]

get_user(username, expansions=None, tweet_fields=None, user_fields=None)

Get single user information by username.

Parameters:

Name Type Description Default
username str

Username to use for querying.

required
expansions list[str] | None

Check field_enums.Expansions for possible options. Defaults to None.

None
tweet_fields list[str] | None

Tweet fields as defined by the Twitter API; only possible if user has a pinned tweet. Check field_enums.TweetFields for possible options. Defaults to None.

None
user_fields list[str] | None

User fields as defined by the Twitter API. Check field_enums.UserFields for possible options. Defaults to None.

None

Returns:

Name Type Description
dict dict

Raw dictionary containing the result of the query. "data" key will have the user info in form of dict (this behaviour may change in the future)

Source code in search_client/client.py
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
def get_user(
    self,
    username: str,
    expansions: list[str] | None = None,
    tweet_fields: list[str] | None = None,
    user_fields: list[str] | None = None,
) -> dict:
    """Look up a single user by username.

    Args:
        username (str):
            Username appended to the request path.

        expansions (list[str] | None, optional):
            Values for the ``expansions`` query parameter.
            Check field_enums.Expansions for possible options. Defaults to None.

        tweet_fields (list[str] | None, optional):
            Tweet fields as defined by the Twitter API; only possible if user has a pinned tweet.
            Check field_enums.TweetFields for possible options. Defaults to None.

        user_fields (list[str] | None, optional):
            User fields as defined by the Twitter API.
            Check field_enums.UserFields for possible options. Defaults to None.

    Returns:
        dict: Raw dictionary decoded from the JSON response.
            "data" key will have the user info in form of dict
            (this behaviour may change in the future)
    """
    endpoint = SearchClient.BASE_URL / "users" / "by" / "username" / username
    optional_lists = (
        ("tweet.fields", tweet_fields),
        ("user.fields", user_fields),
        ("expansions", expansions),
    )
    # Only non-empty lists are sent, each joined into one comma-separated value.
    params = {name: ",".join(values) for name, values in optional_lists if values}
    return requests.get(endpoint, headers=self.headers, params=params).json()

get_users(usernames, expansions=None, tweet_fields=None, user_fields=None)

Get multiple user information by usernames.

Parameters:

Name Type Description Default
usernames list[str]

list of username strings to use for querying

required
expansions list[str] | None

Check field_enums.Expansions for possible options. Defaults to None.

None
tweet_fields list[str] | None

Check field_enums.TweetFields for possible options. Defaults to None.

None
user_fields list[str] | None

Check field_enums.UserFields for possible options. Defaults to None.

None

Returns:

Name Type Description
dict dict

Raw dictionary containing the result of the query.

dict

"data" key will have the user info in form of list of dicts (this behaviour may change in the future)

Source code in search_client/client.py
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
def get_users(
    self,
    usernames: list[str],
    expansions: list[str] | None = None,
    tweet_fields: list[str] | None = None,
    user_fields: list[str] | None = None,
) -> dict:
    """Look up several users at once by their usernames.

    Args:
        usernames (list[str]):
            Usernames to query. A bare string is also accepted and is
            treated as a single username.

        expansions (list[str] | None, optional):
            Values for the ``expansions`` query parameter.
            Check field_enums.Expansions for possible options. Defaults to None.

        tweet_fields (list[str] | None, optional):
            Values for the ``tweet.fields`` query parameter.
            Check field_enums.TweetFields for possible options. Defaults to None.

        user_fields (list[str] | None, optional):
            Values for the ``user.fields`` query parameter.
            Check field_enums.UserFields for possible options. Defaults to None.

    Returns:
        dict: Raw dictionary decoded from the JSON response.
        "data" key will have the user info in form of list of dicts
        (this behaviour may change in the future)
    """
    endpoint = SearchClient.BASE_URL / "users" / "by"
    username_list = [usernames] if isinstance(usernames, str) else usernames

    # Each list is sent as one comma-separated value; empty or missing
    # lists are left out of the query string altogether.
    params = {}
    for name, values in (
        ("usernames", username_list),
        ("tweet.fields", tweet_fields),
        ("user.fields", user_fields),
        ("expansions", expansions),
    ):
        if values:
            params[name] = ",".join(values)

    return requests.get(endpoint, headers=self.headers, params=params).json()