Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1 | r"""UUID objects (universally unique identifiers) according to RFC 4122. |
| 2 | |
| 3 | This module provides immutable UUID objects (class UUID) and the functions |
| 4 | uuid1(), uuid3(), uuid4(), uuid5() for generating version 1, 3, 4, and 5 |
| 5 | UUIDs as specified in RFC 4122. |
| 6 | |
| 7 | If all you want is a unique ID, you should probably call uuid1() or uuid4(). |
| 8 | Note that uuid1() may compromise privacy since it creates a UUID containing |
| 9 | the computer's network address. uuid4() creates a random UUID. |
| 10 | |
| 11 | Typical usage: |
| 12 | |
| 13 | >>> import uuid |
| 14 | |
| 15 | # make a UUID based on the host ID and current time |
Georg Brandl | 1d523e1 | 2009-12-19 18:23:28 +0000 | [diff] [blame] | 16 | >>> uuid.uuid1() # doctest: +SKIP |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 17 | UUID('a8098c1a-f86e-11da-bd1a-00112444be1e') |
| 18 | |
| 19 | # make a UUID using an MD5 hash of a namespace UUID and a name |
| 20 | >>> uuid.uuid3(uuid.NAMESPACE_DNS, 'python.org') |
| 21 | UUID('6fa459ea-ee8a-3ca4-894e-db77e160355e') |
| 22 | |
| 23 | # make a random UUID |
Georg Brandl | 1d523e1 | 2009-12-19 18:23:28 +0000 | [diff] [blame] | 24 | >>> uuid.uuid4() # doctest: +SKIP |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 25 | UUID('16fd2706-8baf-433b-82eb-8c7fada847da') |
| 26 | |
| 27 | # make a UUID using a SHA-1 hash of a namespace UUID and a name |
| 28 | >>> uuid.uuid5(uuid.NAMESPACE_DNS, 'python.org') |
| 29 | UUID('886313e1-3b8a-5372-9b90-0c9aee199e5d') |
| 30 | |
| 31 | # make a UUID from a string of hex digits (braces and hyphens ignored) |
| 32 | >>> x = uuid.UUID('{00010203-0405-0607-0809-0a0b0c0d0e0f}') |
| 33 | |
| 34 | # convert a UUID to a string of hex digits in standard form |
| 35 | >>> str(x) |
| 36 | '00010203-0405-0607-0809-0a0b0c0d0e0f' |
| 37 | |
| 38 | # get the raw 16 bytes of the UUID |
| 39 | >>> x.bytes |
Guido van Rossum | 65b6a80 | 2007-07-09 14:03:08 +0000 | [diff] [blame] | 40 | b'\x00\x01\x02\x03\x04\x05\x06\x07\x08\t\n\x0b\x0c\r\x0e\x0f' |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 41 | |
| 42 | # make a UUID from a 16-byte string |
| 43 | >>> uuid.UUID(bytes=x.bytes) |
| 44 | UUID('00010203-0405-0607-0809-0a0b0c0d0e0f') |
| 45 | """ |
| 46 | |
Benjamin Peterson | 788cb52 | 2015-10-29 20:38:04 -0700 | [diff] [blame] | 47 | import os |
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 48 | import sys |
Benjamin Peterson | 788cb52 | 2015-10-29 20:38:04 -0700 | [diff] [blame] | 49 | |
Ethan Furman | a02cb47 | 2021-04-21 10:20:44 -0700 | [diff] [blame] | 50 | from enum import Enum, _simple_enum |
Barry Warsaw | 8c130d7 | 2017-02-18 15:45:49 -0500 | [diff] [blame] | 51 | |
| 52 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 53 | __author__ = 'Ka-Ping Yee <ping@zesty.ca>' |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 54 | |
# Platform detection.  sys.platform already identifies Windows and macOS, so
# the comparatively expensive ``platform`` module is only imported elsewhere.
if sys.platform not in ('win32', 'darwin'):
    import platform
    _platform_system = platform.system()
    _AIX = (_platform_system == 'AIX')
    _LINUX = (_platform_system == 'Linux')
else:
    _AIX = _LINUX = False

# How MAC addresses appear in command output: AIX separates the octets with
# dots and drops leading zeroes; everything else is treated as colon-separated
# with two hex digits per octet.
_MAC_DELIM = b'.' if _AIX else b':'
_MAC_OMITS_LEADING_ZEROES = _AIX

# Values returned by UUID.variant.
RESERVED_NCS = 'reserved for NCS compatibility'
RFC_4122 = 'specified in RFC 4122'
RESERVED_MICROSOFT = 'reserved for Microsoft compatibility'
RESERVED_FUTURE = 'reserved for future definition'

# Aliases for the built-in types, needed wherever a parameter or property
# named 'int' or 'bytes' shadows the built-in.
int_ = int
bytes_ = bytes
Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 76 | |
Barry Warsaw | 8c130d7 | 2017-02-18 15:45:49 -0500 | [diff] [blame] | 77 | |
# Enumeration used for the ``is_safe`` attribute of UUID objects: it records
# whether a UUID is known to have been generated in a way that is safe for
# multiprocessing applications.
# NOTE(review): the numeric values presumably mirror the status reported by
# the platform's uuid_generate_time_safe(3) -- confirm against the caller.
@_simple_enum(Enum)
class SafeUUID:
    safe = 0
    unsafe = -1
    # Default for UUID(..., is_safe=...); this value is omitted from the
    # pickled state of a UUID.
    unknown = None
| 83 | |
| 84 | |
class UUID:
    """Instances of the UUID class represent UUIDs as specified in RFC 4122.
    UUID objects are immutable, hashable, and usable as dictionary keys.
    Converting a UUID to a string with str() yields something in the form
    '12345678-1234-1234-1234-123456789abc'.  The UUID constructor accepts
    five possible forms: a similar string of hexadecimal digits, or a tuple
    of six integer fields (with 32-bit, 16-bit, 16-bit, 8-bit, 8-bit, and
    48-bit values respectively) as an argument named 'fields', or a bytes
    object of length 16 (with all the integer fields in big-endian order)
    as an argument named 'bytes', or a bytes object of length 16 (with the
    first three fields in little-endian order) as an argument named
    'bytes_le', or a single 128-bit integer as an argument named 'int'.

    UUIDs have these read-only attributes:

        bytes       the UUID as a 16-byte bytes object (containing the six
                    integer fields in big-endian byte order)

        bytes_le    the UUID as a 16-byte bytes object (with time_low,
                    time_mid, and time_hi_version in little-endian byte
                    order)

        fields      a tuple of the six integer fields of the UUID,
                    which are also available as six individual attributes
                    and two derived attributes:

            time_low                the first 32 bits of the UUID
            time_mid                the next 16 bits of the UUID
            time_hi_version         the next 16 bits of the UUID
            clock_seq_hi_variant    the next 8 bits of the UUID
            clock_seq_low           the next 8 bits of the UUID
            node                    the last 48 bits of the UUID

            time                    the 60-bit timestamp
            clock_seq               the 14-bit sequence number

        hex         the UUID as a 32-character hexadecimal string

        int         the UUID as a 128-bit integer

        urn         the UUID as a URN as specified in RFC 4122

        variant     the UUID variant (one of the constants RESERVED_NCS,
                    RFC_4122, RESERVED_MICROSOFT, or RESERVED_FUTURE)

        version     the UUID version number (1 through 5, meaningful only
                    when the variant is RFC_4122)

        is_safe     An enum indicating whether the UUID has been generated in
                    a way that is safe for multiprocessing applications, via
                    uuid_generate_time_safe(3).
    """

    __slots__ = ('int', 'is_safe', '__weakref__')

    def __init__(self, hex=None, bytes=None, bytes_le=None, fields=None,
                 int=None, version=None,
                 *, is_safe=SafeUUID.unknown):
        r"""Create a UUID from either a string of 32 hexadecimal digits,
        a bytes object of length 16 as the 'bytes' argument, a bytes object
        of length 16 in little-endian order as the 'bytes_le' argument, a
        tuple of six integers (32-bit time_low, 16-bit time_mid, 16-bit
        time_hi_version, 8-bit clock_seq_hi_variant, 8-bit clock_seq_low,
        48-bit node) as the 'fields' argument, or a single 128-bit integer
        as the 'int' argument.  When a string of hex digits is given, curly
        braces, hyphens, and a URN prefix are all optional.  For example,
        these expressions all yield the same UUID:

        UUID('{12345678-1234-5678-1234-567812345678}')
        UUID('12345678123456781234567812345678')
        UUID('urn:uuid:12345678-1234-5678-1234-567812345678')
        UUID(bytes=b'\x12\x34\x56\x78'*4)
        UUID(bytes_le=b'\x78\x56\x34\x12\x34\x12\x78\x56' +
                      b'\x12\x34\x56\x78\x12\x34\x56\x78')
        UUID(fields=(0x12345678, 0x1234, 0x5678, 0x12, 0x34, 0x567812345678))
        UUID(int=0x12345678123456781234567812345678)

        Exactly one of 'hex', 'bytes', 'bytes_le', 'fields', or 'int' must
        be given.  The 'version' argument is optional; if given, the resulting
        UUID will have its variant and version set according to RFC 4122,
        overriding the given 'hex', 'bytes', 'bytes_le', 'fields', or 'int'.

        is_safe is an enum exposed as an attribute on the instance.  It
        indicates whether the UUID has been generated in a way that is safe
        for multiprocessing applications, via uuid_generate_time_safe(3).

        Raises TypeError unless exactly one source argument is given, and
        ValueError when the given value is malformed or out of range.
        """

        # Exactly one source argument may be supplied.  Test by identity so
        # that arguments with an unusual __eq__ are never compared to None.
        sources = (hex, bytes, bytes_le, fields, int)
        if sum(source is not None for source in sources) != 1:
            raise TypeError('one of the hex, bytes, bytes_le, fields, '
                            'or int arguments must be given')
        if hex is not None:
            hex = hex.replace('urn:', '').replace('uuid:', '')
            hex = hex.strip('{}').replace('-', '')
            if len(hex) != 32:
                raise ValueError('badly formed hexadecimal UUID string')
            int = int_(hex, 16)
        if bytes_le is not None:
            if len(bytes_le) != 16:
                raise ValueError('bytes_le is not a 16-char string')
            # Reverse the first three fields (4, 2 and 2 bytes) to obtain the
            # big-endian layout; the 'bytes' branch below finishes the job.
            bytes = (bytes_le[4-1::-1] + bytes_le[6-1:4-1:-1] +
                     bytes_le[8-1:6-1:-1] + bytes_le[8:])
        if bytes is not None:
            if len(bytes) != 16:
                raise ValueError('bytes is not a 16-char string')
            assert isinstance(bytes, bytes_), repr(bytes)
            int = int_.from_bytes(bytes, byteorder='big')
        if fields is not None:
            if len(fields) != 6:
                raise ValueError('fields is not a 6-tuple')
            (time_low, time_mid, time_hi_version,
             clock_seq_hi_variant, clock_seq_low, node) = fields
            if not 0 <= time_low < 1<<32:
                raise ValueError('field 1 out of range (need a 32-bit value)')
            if not 0 <= time_mid < 1<<16:
                raise ValueError('field 2 out of range (need a 16-bit value)')
            if not 0 <= time_hi_version < 1<<16:
                raise ValueError('field 3 out of range (need a 16-bit value)')
            if not 0 <= clock_seq_hi_variant < 1<<8:
                raise ValueError('field 4 out of range (need an 8-bit value)')
            if not 0 <= clock_seq_low < 1<<8:
                raise ValueError('field 5 out of range (need an 8-bit value)')
            if not 0 <= node < 1<<48:
                raise ValueError('field 6 out of range (need a 48-bit value)')
            clock_seq = (clock_seq_hi_variant << 8) | clock_seq_low
            int = ((time_low << 96) | (time_mid << 80) |
                   (time_hi_version << 64) | (clock_seq << 48) | node)
        if int is not None:
            if not 0 <= int < 1<<128:
                raise ValueError('int is out of range (need a 128-bit value)')
        if version is not None:
            if not 1 <= version <= 5:
                raise ValueError('illegal version number')
            # Set the variant to RFC 4122.
            int &= ~(0xc000 << 48)
            int |= 0x8000 << 48
            # Set the version number.
            int &= ~(0xf000 << 64)
            int |= version << 76
        # __setattr__ is disabled on this class, so go through object.
        object.__setattr__(self, 'int', int)
        object.__setattr__(self, 'is_safe', is_safe)

    def __getstate__(self):
        """Return the pickle state: 'int', plus 'is_safe' when it is known."""
        d = {'int': self.int}
        if self.is_safe != SafeUUID.unknown:
            # is_safe is a SafeUUID instance.  Return just its value, so that
            # it can be un-pickled in older Python versions without SafeUUID.
            d['is_safe'] = self.is_safe.value
        return d

    def __setstate__(self, state):
        """Restore the instance from a state dict made by __getstate__."""
        object.__setattr__(self, 'int', state['int'])
        # is_safe was added in 3.7; it is also omitted when it is "unknown"
        object.__setattr__(self, 'is_safe',
                           SafeUUID(state['is_safe'])
                           if 'is_safe' in state else SafeUUID.unknown)

    def __eq__(self, other):
        if isinstance(other, UUID):
            return self.int == other.int
        return NotImplemented

    # Q. What's the value of being able to sort UUIDs?
    # A. Use them as keys in a B-Tree or similar mapping.

    def __lt__(self, other):
        if isinstance(other, UUID):
            return self.int < other.int
        return NotImplemented

    def __gt__(self, other):
        if isinstance(other, UUID):
            return self.int > other.int
        return NotImplemented

    def __le__(self, other):
        if isinstance(other, UUID):
            return self.int <= other.int
        return NotImplemented

    def __ge__(self, other):
        if isinstance(other, UUID):
            return self.int >= other.int
        return NotImplemented

    def __hash__(self):
        return hash(self.int)

    def __int__(self):
        return self.int

    def __repr__(self):
        return '%s(%r)' % (self.__class__.__name__, str(self))

    def __setattr__(self, name, value):
        raise TypeError('UUID objects are immutable')

    def __str__(self):
        hex = '%032x' % self.int
        return '%s-%s-%s-%s-%s' % (
            hex[:8], hex[8:12], hex[12:16], hex[16:20], hex[20:])

    @property
    def bytes(self):
        """The UUID as 16 bytes in big-endian order."""
        return self.int.to_bytes(16, 'big')

    @property
    def bytes_le(self):
        """The UUID as 16 bytes with the first three fields byte-reversed."""
        bytes = self.bytes
        return (bytes[4-1::-1] + bytes[6-1:4-1:-1] + bytes[8-1:6-1:-1] +
                bytes[8:])

    @property
    def fields(self):
        """The six integer fields of the UUID as a tuple."""
        return (self.time_low, self.time_mid, self.time_hi_version,
                self.clock_seq_hi_variant, self.clock_seq_low, self.node)

    @property
    def time_low(self):
        return self.int >> 96

    @property
    def time_mid(self):
        return (self.int >> 80) & 0xffff

    @property
    def time_hi_version(self):
        return (self.int >> 64) & 0xffff

    @property
    def clock_seq_hi_variant(self):
        return (self.int >> 56) & 0xff

    @property
    def clock_seq_low(self):
        return (self.int >> 48) & 0xff

    @property
    def time(self):
        """The 60-bit timestamp assembled from the three time fields."""
        return (((self.time_hi_version & 0x0fff) << 48) |
                (self.time_mid << 32) | self.time_low)

    @property
    def clock_seq(self):
        """The 14-bit sequence number (variant bits masked off)."""
        return (((self.clock_seq_hi_variant & 0x3f) << 8) |
                self.clock_seq_low)

    @property
    def node(self):
        return self.int & 0xffffffffffff

    @property
    def hex(self):
        return '%032x' % self.int

    @property
    def urn(self):
        return 'urn:uuid:' + str(self)

    @property
    def variant(self):
        """One of RESERVED_NCS, RFC_4122, RESERVED_MICROSOFT, RESERVED_FUTURE.

        Decided by the leading bits of clock_seq_hi_variant.
        """
        if not self.int & (0x8000 << 48):
            return RESERVED_NCS
        elif not self.int & (0x4000 << 48):
            return RFC_4122
        elif not self.int & (0x2000 << 48):
            return RESERVED_MICROSOFT
        else:
            return RESERVED_FUTURE

    @property
    def version(self):
        """The version number, or None when the variant is not RFC_4122."""
        # The version bits are only meaningful for RFC 4122 UUIDs.
        if self.variant == RFC_4122:
            return int((self.int >> 76) & 0xf)
        return None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 358 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 359 | |
def _get_command_stdout(command, *args):
    """Run *command* with *args* and return its captured standard output.

    The executable is searched for on PATH (falling back to os.defpath),
    with '/sbin' and '/usr/sbin' appended as extra search directories.

    Returns an io.BytesIO wrapping the bytes written to stdout, or None
    when the executable cannot be found or the process cannot be run.
    """
    # Imported lazily: these modules are only needed on this code path.
    import io
    import os
    import shutil
    import subprocess

    try:
        path_dirs = os.environ.get('PATH', os.defpath).split(os.pathsep)
        path_dirs.extend(['/sbin', '/usr/sbin'])
        executable = shutil.which(command, path=os.pathsep.join(path_dirs))
        if executable is None:
            return None
        # LC_ALL=C to ensure English output, stderr=DEVNULL to prevent output
        # on stderr (Note: we don't have an example where the words we search
        # for are actually localized, but in theory some system could do so.)
        env = dict(os.environ)
        env['LC_ALL'] = 'C'
        # subprocess.run() waits for the child and cleans it up even when an
        # exception interrupts the wait.
        completed = subprocess.run((executable,) + args,
                                   stdout=subprocess.PIPE,
                                   stderr=subprocess.DEVNULL,
                                   env=env)
        return io.BytesIO(completed.stdout)
    except (OSError, subprocess.SubprocessError):
        return None
| 384 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 385 | |
# In a MAC (a.k.a. IEEE 802, or EUI-48) address, the second least significant
# bit of the first octet tells whether the address is universally (0) or
# locally (1) administered.  Network cards from hardware manufacturers are
# always universally administered, which guarantees that their MAC address is
# globally unique, but a machine may also have locally administered
# interfaces.  One example of the latter is the bridge interface to the Touch
# Bar on MacBook Pros.
#
# Counting from 1 at the least significant end, that bit is the 42nd bit of
# the 48-bit address, i.e. 1<<41.  Universally administered addresses are
# preferred because they are globally unique; the first locally administered
# address found is used only when the machine has nothing better.
#
# See https://en.wikipedia.org/wiki/MAC_address#Universal_vs._local

def _is_universal(mac):
    """Return True if the integer *mac* is universally administered."""
    local_bit = (mac >> 41) & 1
    return local_bit == 0
| 403 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 404 | |
def _find_mac_near_keyword(command, args, keywords, get_word_index):
    """Searches a command's output for a MAC address near a keyword.

    Each line of words in the output is case-insensitively searched for
    any of the given keywords.  Upon a match, get_word_index is invoked
    to pick a word from the line, given the index of the match.  For
    example, lambda i: 0 would get the first word on the line, while
    lambda i: i - 1 would get the word preceding the keyword.

    command is the program to run and args its options as one
    whitespace-separated string ('' means no options).  keywords must be
    lowercase bytes, because each output line is lowercased before the
    comparison.

    Returns the first universally administered MAC address found as an
    int, else the first locally administered one, else None.
    """
    # Split the option string so that each option becomes its own argv
    # entry; in particular '' must run the command with no arguments
    # rather than with a single empty argument.
    stdout = _get_command_stdout(command, *args.split())
    if stdout is None:
        return None

    first_local_mac = None
    for line in stdout:
        words = line.lower().rstrip().split()
        for i, word in enumerate(words):
            if word not in keywords:
                continue
            try:
                candidate = words[get_word_index(i)]
                mac = int(candidate.replace(_MAC_DELIM, b''), 16)
            except (ValueError, IndexError):
                # Virtual interfaces, such as those provided by
                # VPNs, do not have a colon-delimited MAC address
                # as expected, but a 16-byte HWAddr separated by
                # dashes. These should be ignored in favor of a
                # real MAC address
                continue
            if _is_universal(mac):
                return mac
            first_local_mac = first_local_mac or mac
    # A MAC of 0 is reported as "not found".
    return first_local_mac or None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 438 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 439 | |
def _parse_mac(word):
    """Parse the bytes *word* as a MAC address; return an int or None.

    The word must consist of exactly six parts separated by _MAC_DELIM,
    each made of hexadecimal digits only.  Anything else yields None.
    """
    # Accept 'HH:HH:HH:HH:HH:HH' MAC address (ex: '52:54:00:9d:0e:67'),
    # but reject IPv6 address (ex: 'fe80::5054:ff:fe9' or '123:2:3:4:5:6:7:8').
    #
    # Virtual interfaces, such as those provided by VPNs, do not have a
    # colon-delimited MAC address as expected, but a 16-byte HWAddr separated
    # by dashes. These should be ignored in favor of a real MAC address
    parts = word.split(_MAC_DELIM)
    if len(parts) != 6:
        return None
    if _MAC_OMITS_LEADING_ZEROES:
        # (Only) on AIX the macaddr value given is not prefixed by 0, e.g.
        # en0   1500  link#2      fa.bc.de.f7.62.4    110854824     0 160133733     0     0
        # not
        # en0   1500  link#2      fa.bc.de.f7.62.04   110854824     0 160133733     0     0
        if not all(1 <= len(part) <= 2 for part in parts):
            return None
        hexstr = b''.join(part.rjust(2, b'0') for part in parts)
    else:
        if not all(len(part) == 2 for part in parts):
            return None
        hexstr = b''.join(parts)
    # int() would also accept a leading sign and '_' digit separators, so
    # insist on hexadecimal digits only before converting.
    if not all(char in b'0123456789abcdefABCDEF' for char in hexstr):
        return None
    return int(hexstr, 16)
| 466 | |
| 467 | |
def _find_mac_under_heading(command, args, heading):
    """Looks for a MAC address under a heading in a command's output.

    The first line of words in the output is searched for the given
    heading.  Words at the same word index as the heading in subsequent
    lines are then examined to see if they look like MAC addresses.

    command is the program to run and args its options as one
    whitespace-separated string ('' means no options).  heading is
    compared against the bytes words of the first output line.

    Returns the first universally administered MAC address found as an
    int, else the first locally administered one, else None.
    """
    # Split the option string so that each option becomes its own argv
    # entry and '' runs the command without arguments.
    stdout = _get_command_stdout(command, *args.split())
    if stdout is None:
        return None

    keywords = stdout.readline().rstrip().split()
    try:
        column_index = keywords.index(heading)
    except ValueError:
        return None

    first_local_mac = None
    for line in stdout:
        words = line.rstrip().split()
        try:
            word = words[column_index]
        except IndexError:
            # Line has fewer columns than the header line.
            continue

        mac = _parse_mac(word)
        if mac is None:
            continue
        if _is_universal(mac):
            return mac
        if first_local_mac is None:
            first_local_mac = mac

    return first_local_mac
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 502 | |
| 503 | |
| 504 | # The following functions call external programs to 'get' a macaddr value to |
| 505 | # be used as basis for an uuid |
def _ifconfig_getnode():
    """Return the hardware address reported by ifconfig on Unix, or None."""
    # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes.
    keywords = (b'hwaddr', b'ether', b'address:', b'lladdr')
    # Lazy generator: each ifconfig variant only runs if the ones before it
    # produced nothing.  The address is the word right after the keyword.
    attempts = (
        _find_mac_near_keyword('ifconfig', flags, keywords, lambda i: i+1)
        for flags in ('', '-a', '-av')
    )
    return next((mac for mac in attempts if mac), None)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 515 | |
def _ip_getnode():
    """Return the hardware address reported by `ip link` on Unix, or None."""
    # This works on Linux with iproute2.  The address is the word that
    # follows 'link/ether'.
    link_mac = _find_mac_near_keyword('ip', 'link', [b'link/ether'],
                                      lambda i: i+1)
    return link_mac if link_mac else None
Serhiy Storchaka | ac4aa7b | 2014-11-30 20:39:04 +0200 | [diff] [blame] | 523 | |
def _arp_getnode():
    """Get the hardware address on Unix by running arp.

    The local host name is resolved to an IP address, and the output of
    'arp -an' is searched for that address using several platform-specific
    layouts.  Returns None if the host name cannot be resolved or if no
    layout yields an address.
    """
    import os
    import socket

    try:
        host_ip = socket.gethostbyname(socket.gethostname())
    except OSError:
        return None

    plain_ip = os.fsencode(host_ip)
    bracketed_ip = os.fsencode('(%s)' % host_ip)
    # Each entry is (keywords to look for, function mapping the keyword's
    # word index to the index of the word holding the MAC address).
    layouts = (
        # Try getting the MAC addr from arp based on our IP address (Solaris).
        ([plain_ip], lambda i: -1),
        # This works on OpenBSD
        ([plain_ip], lambda i: i+1),
        # This works on Linux, FreeBSD and NetBSD
        ([bracketed_ip], lambda i: i+2),
    )
    for keywords, pick_index in layouts:
        found = _find_mac_near_keyword('arp', '-an', keywords, pick_index)
        if found:
            return found
    # Return None instead of 0.
    return None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 549 | |
def _lanscan_getnode():
    """Get the hardware address on Unix by running lanscan.

    Runs 'lanscan -ai' and looks for the b'lan0' keyword; the index
    function always selects word 0.  Returns whatever
    _find_mac_near_keyword() returns.
    """
    # This might work on HP-UX.
    lan0_result = _find_mac_near_keyword(
        'lanscan', '-ai', [b'lan0'], lambda i: 0)
    return lan0_result
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 554 | |
def _netstat_getnode():
    """Get the hardware address on Unix by running netstat.

    Runs 'netstat -ian' and reads the column under the b'Address' heading.
    Returns whatever _find_mac_under_heading() returns.
    """
    # This works on AIX and might work on Tru64 UNIX.
    address_column_result = _find_mac_under_heading(
        'netstat', '-ian', b'Address')
    return address_column_result
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 559 | |
def _ipconfig_getnode():
    """[DEPRECATED] Get the hardware address on Windows.

    This is now only a thin alias: it returns the result of
    _windll_getnode() unchanged.
    """
    # bpo-40501: UuidCreateSequential() is now the only supported approach
    node = _windll_getnode()
    return node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 564 | |
def _netbios_getnode():
    """[DEPRECATED] Get the hardware address on Windows.

    This is now only a thin alias: it returns the result of
    _windll_getnode() unchanged.
    """
    # bpo-40501: UuidCreateSequential() is now the only supported approach
    node = _windll_getnode()
    return node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 569 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 570 | |
# Import optional C extension at toplevel, to help disabling it when testing.
# When the extension is missing, every name derived from it is set to None
# so the rest of the module can test for availability.
try:
    import _uuid
except ImportError:
    _uuid = _generate_time_safe = _UuidCreate = None
    _has_uuid_generate_time_safe = None
else:
    # Either entry point may be absent from the extension, hence getattr()
    # with a None default.
    _generate_time_safe = getattr(_uuid, "generate_time_safe", None)
    _UuidCreate = getattr(_uuid, "UuidCreate", None)
    _has_uuid_generate_time_safe = _uuid.has_uuid_generate_time_safe
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 582 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 583 | |
def _load_system_functions():
    """[DEPRECATED] Platform-specific functions loaded at import time.

    This function has no remaining work to do: calling it has no effect
    and it returns None.
    """
    return None
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 586 | |
| 587 | |
def _unix_getnode():
    """Get the hardware address on Unix using the _uuid extension module.

    Returns the node field of a UUID built from the bytes produced by
    _generate_time_safe(), or None when that function is unavailable.
    """
    if not _generate_time_safe:
        return None
    # Only the UUID bytes are needed here; the second element is ignored.
    time_based_bytes, _unused = _generate_time_safe()
    return UUID(bytes=time_based_bytes).node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 593 | |
def _windll_getnode():
    """Get the hardware address on Windows using the _uuid extension module.

    Returns the node field of a UUID built from the bytes produced by
    _UuidCreate(), or None when that function is unavailable.
    """
    if not _UuidCreate:
        return None
    # The result of _UuidCreate() is interpreted as little-endian bytes.
    raw_le_bytes = _UuidCreate()
    return UUID(bytes_le=raw_le_bytes).node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 599 | |
def _random_getnode():
    """Get a random node ID.

    Returns a random 48-bit integer whose multicast bit (1 << 40) is set.
    """
    # RFC 4122, $4.1.6 says "For systems with no IEEE address, a randomly or
    # pseudo-randomly generated value may be used; see Section 4.5.  The
    # multicast bit must be set in such addresses, in order that they will
    # never conflict with addresses obtained from network cards."
    #
    # The "multicast bit" of a MAC address is defined to be "the least
    # significant bit of the first octet".  This works out to be the 41st bit
    # counting from 1 being the least significant bit, or 1<<40.
    #
    # See https://en.wikipedia.org/wiki/MAC_address#Unicast_vs._multicast
    import random

    multicast_bit = 1 << 40
    random_48_bits = random.getrandbits(48)
    return random_48_bits | multicast_bit
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 614 | |
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 615 | |
# _OS_GETTERS, when known, are targeted for a specific OS or platform.
# The order is by 'common practice' on the specified platform; getnode()
# tries the entries of _GETTERS from first to last.
# Note: on 'posix' and 'nt' the _OS_GETTERS are prefixed in _GETTERS by the
# extension-module getter (_unix_getnode or _windll_getnode respectively)
# which, when successful, means none of these "external" methods are called.
# _GETTERS is (also) used by test_uuid.py to SkipUnless(), e.g.,
#     @unittest.skipUnless(_uuid._ifconfig_getnode in _uuid._GETTERS, ...)
if _LINUX:
    _OS_GETTERS = [_ip_getnode, _ifconfig_getnode]
elif sys.platform == 'darwin':
    _OS_GETTERS = [_ifconfig_getnode, _arp_getnode, _netstat_getnode]
elif sys.platform == 'win32':
    # bpo-40201: _windll_getnode will always succeed, so these are not needed
    # NOTE(review): the deprecated Windows getters in this file cite
    # bpo-40501 for the same change -- confirm which issue number is right.
    _OS_GETTERS = []
elif _AIX:
    _OS_GETTERS = [_netstat_getnode]
else:
    # Unknown platform: try every external-program getter.
    _OS_GETTERS = [_ifconfig_getnode, _ip_getnode, _arp_getnode,
                   _netstat_getnode, _lanscan_getnode]
if os.name == 'posix':
    _GETTERS = [_unix_getnode] + _OS_GETTERS
elif os.name == 'nt':
    _GETTERS = [_windll_getnode] + _OS_GETTERS
else:
    # No extension-module getter applies; _GETTERS is the very same list
    # object as _OS_GETTERS here, not a copy.
    _GETTERS = _OS_GETTERS
| 640 | |
# Cached result of getnode(); None until a valid node has been obtained.
_node = None

def getnode():
    """Get the hardware address as a 48-bit positive integer.

    The first time this runs, it may launch a separate program, which could
    be quite slow.  If all attempts to obtain the hardware address fail, we
    choose a random 48-bit number with the multicast bit (the least
    significant bit of the first octet) set to 1, as recommended in
    RFC 4122.

    The result is cached in the module-level _node, so later calls return
    immediately.  Only a validated value is ever stored in the cache.

    Raises AssertionError if even _random_getnode() fails to produce a
    value in range(1 << 48); this is not expected to happen.
    """
    global _node
    if _node is not None:
        return _node

    candidate = None
    for getter in _GETTERS + [_random_getnode]:
        try:
            candidate = getter()
        except Exception:
            # Best effort: a getter that fails just means we try the next
            # one.  KeyboardInterrupt and SystemExit are deliberately not
            # swallowed.
            continue
        if (candidate is not None) and (0 <= candidate < (1 << 48)):
            # Publish to the cache only once the value is known to be valid.
            _node = candidate
            return _node
    # Raised explicitly (rather than via an assert statement) so that the
    # check is not stripped when running under -O.
    raise AssertionError(
        '_random_getnode() returned invalid value: {}'.format(candidate))
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 663 | |
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 664 | |
# Timestamp used by the most recent pure-Python uuid1() call, kept so that
# successive timestamps are strictly increasing.
_last_timestamp = None

def uuid1(node=None, clock_seq=None):
    """Generate a UUID from a host ID, sequence number, and the current time.

    If 'node' is not given, getnode() is used to obtain the hardware
    address.  If 'clock_seq' is given, it is used as the sequence number;
    otherwise a random 14-bit sequence number is chosen.
    """
    global _last_timestamp

    # When the system provides a version-1 UUID generator, use it (but don't
    # use UuidCreate here because its UUIDs don't conform to RFC 4122).
    # This path is only taken when the caller supplied neither argument.
    system_generator_usable = (
        _generate_time_safe is not None
        and node is None
        and clock_seq is None
    )
    if system_generator_usable:
        raw_bytes, safety_flag = _generate_time_safe()
        try:
            safety = SafeUUID(safety_flag)
        except ValueError:
            # Flag value not known to SafeUUID.
            safety = SafeUUID.unknown
        return UUID(bytes=raw_bytes, is_safe=safety)

    import time
    # 0x01b21dd213814000 is the number of 100-ns intervals between the
    # UUID epoch 1582-10-15 00:00:00 and the Unix epoch 1970-01-01 00:00:00.
    ticks = time.time_ns() // 100 + 0x01b21dd213814000
    # Never hand out a timestamp that is not greater than the previous one.
    if _last_timestamp is not None and ticks <= _last_timestamp:
        ticks = _last_timestamp + 1
    _last_timestamp = ticks

    if clock_seq is None:
        import random
        clock_seq = random.getrandbits(14)  # instead of stable storage

    # Split the timestamp and the clock sequence into the UUID fields.
    low_32 = ticks & 0xffffffff
    mid_16 = (ticks >> 32) & 0xffff
    high_12 = (ticks >> 48) & 0x0fff
    seq_low = clock_seq & 0xff
    seq_high = (clock_seq >> 8) & 0x3f

    if node is None:
        node = getnode()
    fields = (low_32, mid_16, high_12, seq_high, seq_low, node)
    return UUID(fields=fields, version=1)
| 704 | |
def uuid3(namespace, name):
    """Generate a UUID from the MD5 hash of a namespace UUID and a name.

    'namespace' is a UUID whose 16 bytes prefix the hashed data.  'name'
    may be a str, which is encoded as UTF-8, or a bytes-like object, which
    is hashed as is.  Returns a version 3 UUID built from the first 16
    bytes of the digest.
    """
    if isinstance(name, str):
        name = bytes(name, "utf-8")
    from hashlib import md5
    # MD5 is used here only to derive an identifier, not for security, so
    # it must stay usable on builds that restrict insecure hashes.
    digest = md5(namespace.bytes + name, usedforsecurity=False).digest()
    return UUID(bytes=digest[:16], version=3)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 713 | |
def uuid4():
    """Generate a random UUID.

    The UUID is built from 16 bytes obtained from os.urandom() and marked
    as version 4.
    """
    random_bytes = os.urandom(16)
    return UUID(bytes=random_bytes, version=4)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 717 | |
def uuid5(namespace, name):
    """Generate a UUID from the SHA-1 hash of a namespace UUID and a name.

    'namespace' is a UUID whose 16 bytes prefix the hashed data.  'name'
    may be a str, which is encoded as UTF-8, or a bytes-like object, which
    is hashed as is.  Returns a version 5 UUID built from the first 16
    bytes of the digest.
    """
    if isinstance(name, str):
        name = bytes(name, "utf-8")
    from hashlib import sha1
    # SHA-1 is used here only to derive an identifier, not for security;
    # flag it the same way uuid3() flags MD5 so it stays usable on builds
    # that restrict insecure hashes.
    digest = sha1(namespace.bytes + name, usedforsecurity=False).digest()
    return UUID(bytes=digest[:16], version=5)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 723 | |
# The following standard UUIDs are for use with uuid3() or uuid5().
# They are the predefined name space IDs listed in RFC 4122, Appendix C;
# pass one as the 'namespace' argument to say what kind of name is hashed.

# The name is a fully-qualified domain name.
NAMESPACE_DNS = UUID('6ba7b810-9dad-11d1-80b4-00c04fd430c8')
# The name is a URL.
NAMESPACE_URL = UUID('6ba7b811-9dad-11d1-80b4-00c04fd430c8')
# The name is an ISO OID.
NAMESPACE_OID = UUID('6ba7b812-9dad-11d1-80b4-00c04fd430c8')
# The name is an X.500 DN.
NAMESPACE_X500 = UUID('6ba7b814-9dad-11d1-80b4-00c04fd430c8')