{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":180136168,"defaultBranch":"master","name":"trafilatura","ownerLogin":"adbar","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2019-04-08T11:38:48.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/2125866?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1716559304.0","currentOid":""},"activityList":{"items":[{"before":"28793934248a84fccd285b05f1e6367033f8b7ba","after":"0170a9faff634f92204b63c02b2a5f56c11e2482","ref":"refs/heads/master","pushedAt":"2024-05-24T14:01:44.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"CLI file processing fixes: options, mtime and tests (#605)\n\n* CLI fixes: file processing options, mtime, and tests\r\n\r\n* use stat for efficiency","shortMessageHtmlLink":"CLI file processing fixes: options, mtime and tests (#605)"}},{"before":"01021a75fb477dc82b2ec92ab1df22a311ce18c8","after":null,"ref":"refs/heads/fix_cli_fileproc","pushedAt":"2024-05-24T14:01:44.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"ce0bca085cea27b33b8271853a1325efac61556e","after":"01021a75fb477dc82b2ec92ab1df22a311ce18c8","ref":"refs/heads/fix_cli_fileproc","pushedAt":"2024-05-24T12:56:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"use stat for efficiency","shortMessageHtmlLink":"use stat for efficiency"}},{"before":null,"after":"ce0bca085cea27b33b8271853a1325efac61556e","ref":"refs/heads/fix_cli_fileproc","pushedAt":"2024-05-24T12:44:22.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"CLI fixes: file processing options, mtime, and tests","shortMessageHtmlLink":"CLI fixes: file processing options, mtime, and tests"}},{"before":"6d6ebffec552b1d7d5d8e8b068a6efe50bc7871f","after":null,"ref":"refs/heads/add_meta","pushedAt":"2024-05-22T16:27:28.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"f21f2935271f9c14a75bc23e775c61118d080e45","after":"28793934248a84fccd285b05f1e6367033f8b7ba","ref":"refs/heads/master","pushedAt":"2024-05-22T16:27:27.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"metadata: add author XPath extractors (#567)\n\n* metadata: add author XPaths\r\n\r\n* add @data-testid with test","shortMessageHtmlLink":"metadata: add author XPath extractors (#567)"}},{"before":"0d56c02ddf85d96ccbbd995eeb2af5005577728c","after":"6d6ebffec552b1d7d5d8e8b068a6efe50bc7871f","ref":"refs/heads/add_meta","pushedAt":"2024-05-22T16:22:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"add @data-testid with test","shortMessageHtmlLink":"add @data-testid with test"}},{"before":"1ce0e76ced5d3589a1fbe7aa17fc35a96c3c431a","after":"f21f2935271f9c14a75bc23e775c61118d080e45","ref":"refs/heads/master","pushedAt":"2024-05-21T10:48:49.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"docs: fix typos (#603)\n\n* fix typos\r\n\r\nno functional change\r\n\r\n* Update evaldata.py\r\n\r\n---------\r\n\r\nCo-authored-by: Adrien Barbaresi ","shortMessageHtmlLink":"docs: fix typos (#603)"}},{"before":"090eda6964e99423733033230a9f805d0fdc3117","after":null,"ref":"refs/heads/fix_txt_lists","pushedAt":"2024-05-16T15:24:21.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"9307d90a3c0b4639e4dc4f02b7be827a1fe5fa6d","after":"1ce0e76ced5d3589a1fbe7aa17fc35a96c3c431a","ref":"refs/heads/master","pushedAt":"2024-05-16T15:24:20.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"fix: list spacing in TXT output (#598)","shortMessageHtmlLink":"fix: list spacing in TXT output (#598)"}},{"before":"f98f557b236e8eaf646e24c68d7e28950e065473","after":"9307d90a3c0b4639e4dc4f02b7be827a1fe5fa6d","ref":"refs/heads/master","pushedAt":"2024-05-16T11:47:26.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"Port of is_probably_readerable from mozilla (#587)\n\n* port of is_probably_readerable from mozilla\r\n\r\n* change xpath selector\r\n\r\n* test: add unit test\r\n\r\n* test: fixes\r\n\r\n* fix cli test\r\n\r\n* add tests for uncovered lines and fix xpath\r\n\r\n* fix test and lint error\r\n\r\n* switch xpath to use //div/br and use parent\r\n\r\n* minor changes\r\n\r\n* order imports","shortMessageHtmlLink":"Port of is_probably_readerable from mozilla (#587)"}},{"before":null,"after":"090eda6964e99423733033230a9f805d0fdc3117","ref":"refs/heads/fix_txt_lists","pushedAt":"2024-05-16T11:35:14.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"fix: list spacing in TXT output","shortMessageHtmlLink":"fix: list spacing in TXT output"}},{"before":"7abf8fe6f903fb292f66e338ba1057cea4639baa","after":null,"ref":"refs/heads/accept_encoding","pushedAt":"2024-05-15T16:12:16.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"2f66f1c2e3474b8555c82142c46831588cb8b242","after":"f98f557b236e8eaf646e24c68d7e28950e065473","ref":"refs/heads/master","pushedAt":"2024-05-15T16:12:15.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"downloads: fix deflate decoding and add optional zstd to accepted encodings (#594)\n\n* downloads: fix deflate and add optional zstd to accepted encodings\r\n\r\n* polish\r\n\r\n* better logging and minimal version","shortMessageHtmlLink":"downloads: fix deflate decoding and add optional zstd to accepted enc…"}},{"before":"23da16aaee74364234bb742f30309d4b7b35452a","after":"7abf8fe6f903fb292f66e338ba1057cea4639baa","ref":"refs/heads/accept_encoding","pushedAt":"2024-05-15T16:04:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"better logging and minimal version","shortMessageHtmlLink":"better logging and minimal version"}},{"before":"c5d0bf078f12b8f47611086058375a49c252af86","after":"23da16aaee74364234bb742f30309d4b7b35452a","ref":"refs/heads/accept_encoding","pushedAt":"2024-05-15T13:01:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"polish","shortMessageHtmlLink":"polish"}},{"before":null,"after":"c5d0bf078f12b8f47611086058375a49c252af86","ref":"refs/heads/accept_encoding","pushedAt":"2024-05-15T12:39:54.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"downloads: fix deflate and add optional zstd to accepted encodings","shortMessageHtmlLink":"downloads: fix deflate and add optional zstd to accepted encodings"}},{"before":"e114a47ed3d3577e7150bf332f388fd1a43d0d54","after":null,"ref":"refs/heads/update_justext","pushedAt":"2024-05-13T11:28:04.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"ef32fe753a2f3bece8d9e191e1b00866b4710da1","after":"2f66f1c2e3474b8555c82142c46831588cb8b242","ref":"refs/heads/master","pushedAt":"2024-05-13T11:28:03.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"setup: update justext and lxml dependencies (#593)\n\n* setup: update justext and lxml dependencies\r\n\r\n* test lxml update\r\n\r\n* add CI test\r\n\r\n* restore setup clause","shortMessageHtmlLink":"setup: update justext and lxml dependencies (#593)"}},{"before":"e00b3c9f38ebd488d415a2996afd73a022ee7312","after":"e114a47ed3d3577e7150bf332f388fd1a43d0d54","ref":"refs/heads/update_justext","pushedAt":"2024-05-13T11:01:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"restore setup clause","shortMessageHtmlLink":"restore setup clause"}},{"before":"11ead7fa0d4cdacf7697293688578014c8b8a6bd","after":"e00b3c9f38ebd488d415a2996afd73a022ee7312","ref":"refs/heads/update_justext","pushedAt":"2024-05-13T10:55:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"add CI test","shortMessageHtmlLink":"add CI test"}},{"before":"e2bdc0d48678eeb4e50ea322910a42b7cb888a01","after":"11ead7fa0d4cdacf7697293688578014c8b8a6bd","ref":"refs/heads/update_justext","pushedAt":"2024-05-13T10:44:39.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"test lxml update","shortMessageHtmlLink":"test lxml update"}},{"before":null,"after":"e2bdc0d48678eeb4e50ea322910a42b7cb888a01","ref":"refs/heads/update_justext","pushedAt":"2024-05-13T10:28:20.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"setup: update justext and lxml dependencies","shortMessageHtmlLink":"setup: update justext and lxml dependencies"}},{"before":"1d63fb127932d27baa1b59eff4933e7a755c1629","after":null,"ref":"refs/heads/simplify_len_test","pushedAt":"2024-05-08T11:02:32.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"92bdd6e457c1189d751a0d0d42115f4360e863c8","after":"ef32fe753a2f3bece8d9e191e1b00866b4710da1","ref":"refs/heads/master","pushedAt":"2024-05-08T11:02:31.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"simplify code: unique function for length tests (#591)","shortMessageHtmlLink":"simplify code: unique function for length tests (#591)"}},{"before":null,"after":"1d63fb127932d27baa1b59eff4933e7a755c1629","ref":"refs/heads/simplify_len_test","pushedAt":"2024-05-08T10:19:52.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"simplify code: unique function for length tests","shortMessageHtmlLink":"simplify code: unique function for length tests"}},{"before":"af0822c7bde377cf22704b0d65edd4f53f505c22","after":null,"ref":"refs/heads/fix_robots_download","pushedAt":"2024-05-08T09:58:00.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"}},{"before":"efe38bbbe25d126f87478d122d9283835ac20bdf","after":"92bdd6e457c1189d751a0d0d42115f4360e863c8","ref":"refs/heads/master","pushedAt":"2024-05-08T09:57:59.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"spider fix: use internal download utilities for robots.txt (#590)\n\n* spider fix: use internal download utilities for robots.txt\r\n\r\n* separate function and tests","shortMessageHtmlLink":"spider fix: use internal download utilities for robots.txt (#590)"}},{"before":"13c868f03b8d412367c6b0be8517099fe5e5bb94","after":"af0822c7bde377cf22704b0d65edd4f53f505c22","ref":"refs/heads/fix_robots_download","pushedAt":"2024-05-08T09:43:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"separate function and tests","shortMessageHtmlLink":"separate function and tests"}},{"before":null,"after":"13c868f03b8d412367c6b0be8517099fe5e5bb94","ref":"refs/heads/fix_robots_download","pushedAt":"2024-05-08T09:13:39.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"adbar","name":"Adrien Barbaresi","path":"/adbar","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2125866?s=80&v=4"},"commit":{"message":"spider fix: use internal download utilities for robots.txt","shortMessageHtmlLink":"spider fix: use internal download utilities for robots.txt"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEUxp3HQA","startCursor":null,"endCursor":null}},"title":"Activity · adbar/trafilatura"}