File tree Expand file tree Collapse file tree 4 files changed +12
-5
lines changed Expand file tree Collapse file tree 4 files changed +12
-5
lines changed Original file line number Diff line number Diff line change @@ -11,6 +11,7 @@ classifiers = [
11
11
" License :: OSI Approved :: MIT License" ,
12
12
" Operating System :: Unix" ,
13
13
" Operating System :: POSIX" ,
14
+ " Operating System :: MacOS" ,
14
15
" Operating System :: Microsoft :: Windows" ,
15
16
" Natural Language :: Icelandic" ,
16
17
" Programming Language :: Python" ,
@@ -19,6 +20,7 @@ classifiers = [
19
20
" Programming Language :: Python :: 3.10" ,
20
21
" Programming Language :: Python :: 3.11" ,
21
22
" Programming Language :: Python :: 3.12" ,
23
+ " Programming Language :: Python :: 3.13" ,
22
24
" Programming Language :: Python :: Implementation :: CPython" ,
23
25
" Programming Language :: Python :: Implementation :: PyPy" ,
24
26
" Topic :: Software Development :: Libraries :: Python Modules" ,
Original file line number Diff line number Diff line change @@ -717,9 +717,8 @@ def roman_to_int(s: str) -> int:
717
717
# Króna amount strings allowed before a number, e.g. "kr. 9.900"
718
718
ISK_AMOUNT_PRECEDING = frozenset (("kr." , "kr" , "krónur" ))
719
719
720
- # URL prefixes. Note that this list should not contain www since
721
- # www.something.com is a domain token, not a URL token.
722
- URL_PREFIXES = (
720
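+ # URI scheme prefixes. Note that this list should not contain www since www.something.com is a domain token, not a URL token.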
721
+ URI_PREFIXES = (
723
722
"http://" ,
724
723
"https://" ,
725
724
"file://" ,
@@ -735,6 +734,12 @@ def roman_to_int(s: str) -> int:
735
734
"telnet://" ,
736
735
"udp://" ,
737
736
"vnc://" ,
737
+ "irc://" ,
738
+ "nntp://" ,
739
+ "wss://" ,
740
+ "ws://" ,
741
+ "xmpp://" ,
742
+ "mtqp://" ,
738
743
)
739
744
740
745
TOP_LEVEL_DOMAINS = frozenset (
Original file line number Diff line number Diff line change @@ -1848,7 +1848,7 @@ def parse_mixed(
1848
1848
ate = True
1849
1849
1850
1850
rtxt = rt .txt
1851
- if rtxt and rtxt .startswith (URL_PREFIXES ):
1851
+ if rtxt and rtxt .startswith (URI_PREFIXES ):
1852
1852
# Handle URL: cut RIGHT_PUNCTUATION characters off its end,
1853
1853
# even though many of them are actually allowed according to
1854
1854
# the IETF RFC
Original file line number Diff line number Diff line change @@ -46,7 +46,7 @@ def strip_originals(tokens: list[Tok]) -> list[Tok]:
46
46
"""Remove origin tracking info from a list of tokens.
47
47
This is useful for simplifying tests where we don't care about tracking
48
48
origins.
49
- XXX : This could be removed if we get a feature to disable origin
49
+ TODO : This could be removed if we get a feature to disable origin
50
50
tracking during tokenization.
51
51
"""
52
52
You can’t perform that action at this time.
0 commit comments