fix: extract full text from note_tweet for long tweets (fixes #20)

For long tweets (>280 chars), Twitter stores the full text in
note_tweet.note_tweet_results.result.text rather than in legacy.full_text.
The parser now prefers the note_tweet text whenever it is available.
This commit is contained in:
jackwener
2026-03-14 13:45:10 +08:00
parent 7de8ad0fbd
commit ce4326ef42
3 changed files with 14 additions and 1 deletion

View File

@@ -26,6 +26,9 @@ def test_parse_home_timeline_fixture(fixture_loader) -> None:
assert [tweet.id for tweet in tweets] == ["1", "20"]
assert cursor == "cursor-bottom-1"
assert tweets[0].media[0].type == "photo"
# note_tweet full text should be preferred over legacy.full_text for long tweets
assert "Show More" in tweets[0].text
assert tweets[0].text.startswith("Hello\nworld\n")
assert tweets[0].urls == ["https://example.com/post"]
assert tweets[1].is_retweet is True
assert tweets[1].retweeted_by == "bob"