python · sleiderr · May 15, 2023 · May 15, 2023 · May 15, 2023 · May 15, 2023
diff --git a/Lib/netrc.py b/Lib/netrc.py
@@ -2,7 +2,8 @@
 
 # Module and documentation by Eric S. Raymond, 21 Dec 1998
 
-import os, stat
+import os
+import stat
-import os
-import stat
+import os, stat
-import os
-import stat
+import os, stat
 
 __all__ = ["netrc", "NetrcParseError"]
 
@@ -22,6 +23,7 @@ def __str__(self):
 class _netrclex:
     def __init__(self, fp):
         self.lineno = 1
+        self.dontskip = False
         self.instream = fp
         self.whitespace = "\n\t\r "
         self.pushback = []
@@ -33,30 +35,29 @@ def _read_char(self):
         return ch
 
     def get_token(self):
+        self.dontskip = False
         if self.pushback:
             return self.pushback.pop(0)
         token = ""
-        fiter = iter(self._read_char, "")
-        for ch in fiter:
-            if ch in self.whitespace:
+        enquoted = False
+        while ch := self._read_char():
+            if ch == '\\':
+                ch = self._read_char()
+                token += ch
                 continue
+            if ch in self.whitespace and not enquoted:
+                if token == "":
+                    continue
+                if ch == '\n':
+                    self.dontskip = True
+                return token
             if ch == '"':
-                for ch in fiter:
-                    if ch == '"':
-                        return token
-                    elif ch == "\\":
-                        ch = self._read_char()
-                    token += ch
+                if enquoted:
+                    return token
+                enquoted = True
+                continue
             else:
-                if ch == "\\":
-                    ch = self._read_char()
                 token += ch
-                for ch in fiter:
-                    if ch in self.whitespace:
-                        return token
-                    elif ch == "\\":
-                        ch = self._read_char()
-                    token += ch
         return token
 
     def push_token(self, token):
@@ -66,7 +67,7 @@ def push_token(self, token):
 class netrc:
     def __init__(self, file=None):
         default_netrc = file is None
-        if file is None:
+        if default_netrc:
             file = os.path.join(os.path.expanduser("~"), ".netrc")
         self.hosts = {}
         self.macros = {}
@@ -81,13 +82,15 @@ def _parse(self, file, fp, default_netrc):
         lexer = _netrclex(fp)
         while 1:
             # Look for a machine, default, or macdef top-level keyword
-            saved_lineno = lexer.lineno
-            toplevel = tt = lexer.get_token()
+            tt = lexer.get_token()
             if not tt:
                 break
             elif tt[0] == '#':
-                if lexer.lineno == saved_lineno and len(tt) == 1:
+                # For top-level tokens, skip the rest of the line if the '#' is
+                # followed by whitespace. Otherwise, skip only the token itself.
+                if tt == '#' and not lexer.dontskip:
-                if tt == '#' and not lexer.dontskip:
+                if len(tt) == 1 and not lexer.dontskip:
-                if tt == '#' and not lexer.dontskip:
+                if len(tt) == 1 and not lexer.dontskip:
                     lexer.instream.readline()
+                    lexer.lineno += 1
                 continue
             elif tt == 'machine':
                 entryname = lexer.get_token()
@@ -98,6 +101,7 @@ def _parse(self, file, fp, default_netrc):
                 self.macros[entryname] = []
                 while 1:
                     line = lexer.instream.readline()
+                    lexer.lineno += 1
                     if not line:
                         raise NetrcParseError(
                             "Macro definition missing null line terminator.",
@@ -114,17 +118,18 @@ def _parse(self, file, fp, default_netrc):
                     "bad toplevel token %r" % tt, file, lexer.lineno)
 
             if not entryname:
-                raise NetrcParseError("missing %r name" % tt, file, lexer.lineno)
+                raise NetrcParseError(
+                    "missing %r name" % tt, file, lexer.lineno)
-                raise NetrcParseError(
-                    "missing %r name" % tt, file, lexer.lineno)
+                raise NetrcParseError("missing %r name" % tt, file, lexer.lineno)
-                raise NetrcParseError(
-                    "missing %r name" % tt, file, lexer.lineno)
+                raise NetrcParseError("missing %r name" % tt, file, lexer.lineno)
 
             # We're looking at start of an entry for a named machine or default.
             login = account = password = ''
             self.hosts[entryname] = {}
             while 1:
-                prev_lineno = lexer.lineno
                 tt = lexer.get_token()
                 if tt.startswith('#'):
-                    if lexer.lineno == prev_lineno:
+                    if not lexer.dontskip:
                         lexer.instream.readline()
+                        lexer.lineno += 1
                     continue
                 if tt in {'', 'machine', 'default', 'macdef'}:
                     self.hosts[entryname] = (login, account, password)
@@ -165,12 +170,7 @@ def _security_check(self, fp, default_netrc, login):
 
     def authenticators(self, host):
         """Return a (user, account, password) tuple for given host."""
-        if host in self.hosts:
-            return self.hosts[host]
-        elif 'default' in self.hosts:
-            return self.hosts['default']
-        else:
-            return None
+        return self.hosts.get(host, self.hosts.get('default'))
 
     def __repr__(self):
         """Dump the class data in the format of a .netrc file."""
@@ -188,5 +188,6 @@ def __repr__(self):
             rep += "\n"
         return rep
-        return rep
+        return rep
+
+if __name__ == '__main__':
+    print(netrc())
-        return rep
+        return rep
+
+if __name__ == '__main__':
+    print(netrc())
 
+
 if __name__ == '__main__':
     print(netrc())
diff --git a/Lib/test/test_netrc.py b/Lib/test/test_netrc.py
@@ -1,4 +1,8 @@
-import netrc, os, unittest, sys, textwrap
+import netrc
+import os
+import sys
+import textwrap
+import unittest
 from test.support import os_helper, run_unittest
 
 try:
@@ -8,6 +12,7 @@
 
 temp_filename = os_helper.TESTFN
 
+
 class NetrcTestCase(unittest.TestCase):
 
     def make_nrc(self, test_data):
@@ -215,6 +220,14 @@ def test_comment_before_machine_line_hash_only(self):
             machine bar.domain.com login foo password pass
             """)
 
+    def test_comment_after_new_line(self):
+        self._test_comment("""\
+            machine foo.domain.com login bar password pass
+
+            # TEST
+            machine bar.domain.com login foo password pass
+            """)
+
     def test_comment_after_machine_line(self):
         self._test_comment("""\
             machine foo.domain.com login bar password pass
@@ -251,6 +264,13 @@ def test_comment_after_machine_line_hash_only(self):
             #
             """)
 
+    def test_comment_at_first_line(self):
+        self._test_comment("""
+            # TEST
+            machine foo.domain.com login bar password pass
+            machine bar.domain.com login foo password pass
+            """)
+
     def test_comment_at_end_of_machine_line(self):
         self._test_comment("""\
             machine foo.domain.com login bar password pass # comment
@@ -308,8 +328,10 @@ def test_security(self):
             self.assertEqual(nrc.hosts['foo.domain.com'],
                              ('anonymous', '', 'pass'))
 
+
 def test_main():
     run_unittest(NetrcTestCase)
 
+
 if __name__ == "__main__":
     test_main()
diff --git a/Misc/NEWS.d/next/Library/2023-05-15-17-22-53.gh-issue-104306.YMiegg.rst b/Misc/NEWS.d/next/Library/2023-05-15-17-22-53.gh-issue-104306.YMiegg.rst
@@ -0,0 +1 @@
+Fix incorrect comment parsing in the :mod:`netrc` module.
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		Fix incorrect comment parsing in the :mod:`netrc` module.
sleiderr marked this conversation as resolved. Outdated Show resolved Hide resolved