Make fetch_inbox command respect the -n flag

This commit is contained in:
Alessio 2023-11-18 16:26:03 -08:00
parent 46eaf913fd
commit 520b9e366a
4 changed files with 100 additions and 14 deletions

View File

@ -160,7 +160,7 @@ func main() {
case "webserver": case "webserver":
start_webserver(*addr) start_webserver(*addr)
case "fetch_inbox": case "fetch_inbox":
fetch_inbox() fetch_inbox(*how_many)
default: default:
die(fmt.Sprintf("Invalid operation: %s", operation), true, 3) die(fmt.Sprintf("Invalid operation: %s", operation), true, 3)
} }
@ -398,8 +398,8 @@ func start_webserver(addr string) {
app.Run(addr) app.Run(addr)
} }
func fetch_inbox() { func fetch_inbox(how_many int) {
trove := scraper.GetInbox() trove := scraper.GetInbox(how_many)
profile.SaveDMTrove(trove) profile.SaveDMTrove(trove)
happy_exit(fmt.Sprintf("Saved %d messages from %d chats", len(trove.Messages), len(trove.Rooms))) happy_exit(fmt.Sprintf("Saved %d messages from %d chats", len(trove.Messages), len(trove.Rooms)))
} }

View File

@ -48,10 +48,18 @@ type APIDMConversation struct {
} }
type APIInbox struct { type APIInbox struct {
Status string `json:"status"`
MinEntryID int `json:"min_entry_id,string"`
LastSeenEventID int `json:"last_seen_event_id,string"` LastSeenEventID int `json:"last_seen_event_id,string"`
Cursor string `json:"cursor"` Cursor string `json:"cursor"`
Entries []struct { InboxTimelines struct {
Message APIDMMessage `json:"message"` Trusted struct {
Status string `json:"status"`
MinEntryID int `json:"min_entry_id,string"`
} `json:"trusted"`
} `json:"inbox_timelines"`
Entries []struct {
Message APIDMMessage `json:"message"`
} `json:"entries"` } `json:"entries"`
Users map[string]APIUser `json:"users"` Users map[string]APIUser `json:"users"`
Conversations map[string]APIDMConversation `json:"conversations"` Conversations map[string]APIDMConversation `json:"conversations"`
@ -59,20 +67,22 @@ type APIInbox struct {
type APIDMResponse struct { type APIDMResponse struct {
InboxInitialState APIInbox `json:"inbox_initial_state"` InboxInitialState APIInbox `json:"inbox_initial_state"`
InboxTimeline APIInbox `json:"inbox_timeline"`
} }
func (r APIDMResponse) ToDMTrove() DMTrove { func (r APIInbox) ToDMTrove() DMTrove {
ret := NewDMTrove() ret := NewDMTrove()
for _, entry := range r.InboxInitialState.Entries {
for _, entry := range r.Entries {
result := ParseAPIDMMessage(entry.Message) result := ParseAPIDMMessage(entry.Message)
ret.Messages[result.ID] = result ret.Messages[result.ID] = result
// TODO: parse Tweet attachments // TODO: parse Tweet attachments
} }
for _, room := range r.InboxInitialState.Conversations { for _, room := range r.Conversations {
result := ParseAPIDMChatRoom(room) result := ParseAPIDMChatRoom(room)
ret.Rooms[result.ID] = result ret.Rooms[result.ID] = result
} }
for _, u := range r.InboxInitialState.Users { for _, u := range r.Users {
result, err := ParseSingleUser(u) result, err := ParseSingleUser(u)
if err != nil { if err != nil {
panic(err) panic(err)
@ -82,7 +92,7 @@ func (r APIDMResponse) ToDMTrove() DMTrove {
return ret return ret
} }
func (api *API) GetDMInbox() (APIDMResponse, error) { func (api *API) GetDMInbox() (APIInbox, error) {
url, err := url.Parse("https://twitter.com/i/api/1.1/dm/inbox_initial_state.json") url, err := url.Parse("https://twitter.com/i/api/1.1/dm/inbox_initial_state.json")
if err != nil { if err != nil {
panic(err) panic(err)
@ -138,5 +148,66 @@ func (api *API) GetDMInbox() (APIDMResponse, error) {
var result APIDMResponse var result APIDMResponse
err = api.do_http(url.String(), "", &result) err = api.do_http(url.String(), "", &result)
return result, err result.InboxInitialState.Status = result.InboxInitialState.InboxTimelines.Trusted.Status
return result.InboxInitialState, err
}
func (api *API) GetInboxTrusted(oldest_id int) (APIInbox, error) {
url, err := url.Parse("https://twitter.com/i/api/1.1/dm/inbox_timeline/trusted.json")
if err != nil {
panic(err)
}
query := url.Query()
query.Add("max_id", fmt.Sprint(oldest_id))
query.Add("nsfw_filtering_enabled", "false")
query.Add("filter_low_quality", "true")
query.Add("include_quality", "all")
query.Add("include_profile_interstitial_type", "1")
query.Add("include_blocking", "1")
query.Add("include_blocked_by", "1")
query.Add("include_followed_by", "1")
query.Add("include_want_retweets", "1")
query.Add("include_mute_edge", "1")
query.Add("include_can_dm", "1")
query.Add("include_can_media_tag", "1")
query.Add("include_ext_has_nft_avatar", "1")
query.Add("include_ext_is_blue_verified", "1")
query.Add("include_ext_verified_type", "1")
query.Add("include_ext_profile_image_shape", "1")
query.Add("skip_status", "1")
query.Add("dm_secret_conversations_enabled", "false")
query.Add("krs_registration_enabled", "true")
query.Add("cards_platform", "Web-12")
query.Add("include_cards", "1")
query.Add("include_ext_alt_text", "true")
query.Add("include_ext_limited_action_results", "false")
query.Add("include_quote_count", "true")
query.Add("include_reply_count", "1")
query.Add("tweet_mode", "extended")
query.Add("include_ext_views", "true")
query.Add("dm_users", "true")
query.Add("include_groups", "true")
query.Add("include_inbox_timelines", "true")
query.Add("include_ext_media_color", "true")
query.Add("supports_reactions", "true")
query.Add("include_ext_edit_control", "true")
query.Add("ext", strings.Join([]string{
"mediaColor",
"altText",
"mediaStats",
"highlightedLabel",
"hasNftAvatar",
"voiceInfo",
"birdwatchPivot",
"enrichments",
"superFollowMetadata",
"unmentionInfo",
"editControl",
"vibe",
}, ","))
url.RawQuery = query.Encode()
var result APIDMResponse
err = api.do_http(url.String(), "", &result)
return result.InboxTimeline, err
} }

View File

@ -99,7 +99,7 @@ func TestParseInbox(t *testing.T) {
err = json.Unmarshal(data, &inbox) err = json.Unmarshal(data, &inbox)
require.NoError(t, err) require.NoError(t, err)
trove := inbox.ToDMTrove() trove := inbox.InboxInitialState.ToDMTrove()
for _, id := range []DMMessageID{1663623062195957773, 1663623203644751885, 1665922180176044037, 1665936253483614212} { for _, id := range []DMMessageID{1663623062195957773, 1663623203644751885, 1665922180176044037, 1665936253483614212} {
m, is_ok := trove.Messages[id] m, is_ok := trove.Messages[id]

View File

@ -28,7 +28,8 @@ func (t1 *DMTrove) MergeWith(t2 DMTrove) {
t1.TweetTrove.MergeWith(t2.TweetTrove) t1.TweetTrove.MergeWith(t2.TweetTrove)
} }
func GetInbox() DMTrove { // Returns a DMTrove and the cursor for the next update
func GetInbox(how_many int) (DMTrove, string) {
if !the_api.IsAuthenticated { if !the_api.IsAuthenticated {
log.Fatalf("Fetching DMs can only be done when authenticated. Please provide `--session [user]`") log.Fatalf("Fetching DMs can only be done when authenticated. Please provide `--session [user]`")
} }
@ -36,5 +37,19 @@ func GetInbox() DMTrove {
if err != nil { if err != nil {
panic(err) panic(err)
} }
return dm_response.ToDMTrove()
trove := dm_response.ToDMTrove()
cursor := dm_response.Cursor
next_cursor_id := dm_response.InboxTimelines.Trusted.MinEntryID
for len(trove.Rooms) < how_many && dm_response.Status != "AT_END" {
dm_response, err = the_api.GetInboxTrusted(next_cursor_id)
if err != nil {
panic(err)
}
next_trove := dm_response.ToDMTrove()
next_cursor_id = dm_response.MinEntryID
trove.MergeWith(next_trove)
}
return trove, cursor
} }