r"""UUID objects (universally unique identifiers) according to RFC 4122.

This module provides immutable UUID objects (class UUID) and the functions
uuid1(), uuid3(), uuid4(), uuid5() for generating version 1, 3, 4, and 5
UUIDs as specified in RFC 4122.

If all you want is a unique ID, you should probably call uuid1() or uuid4().
Note that uuid1() may compromise privacy since it creates a UUID containing
the computer's network address.  uuid4() creates a random UUID.

Typical usage:

    >>> import uuid

    # make a UUID based on the host ID and current time
    >>> uuid.uuid1()    # doctest: +SKIP
    UUID('a8098c1a-f86e-11da-bd1a-00112444be1e')

    # make a UUID using an MD5 hash of a namespace UUID and a name
    >>> uuid.uuid3(uuid.NAMESPACE_DNS, 'python.org')
    UUID('6fa459ea-ee8a-3ca4-894e-db77e160355e')

    # make a random UUID
    >>> uuid.uuid4()    # doctest: +SKIP
    UUID('16fd2706-8baf-433b-82eb-8c7fada847da')

    # make a UUID using a SHA-1 hash of a namespace UUID and a name
    >>> uuid.uuid5(uuid.NAMESPACE_DNS, 'python.org')
    UUID('886313e1-3b8a-5372-9b90-0c9aee199e5d')

    # make a UUID from a string of hex digits (braces and hyphens ignored)
    >>> x = uuid.UUID('{00010203-0405-0607-0809-0a0b0c0d0e0f}')

    # convert a UUID to a string of hex digits in standard form
    >>> str(x)
    '00010203-0405-0607-0809-0a0b0c0d0e0f'

    # get the raw 16 bytes of the UUID
    >>> x.bytes
    b'\x00\x01\x02\x03\x04\x05\x06\x07\x08\t\n\x0b\x0c\r\x0e\x0f'

    # make a UUID from a 16-byte string
    >>> uuid.UUID(bytes=x.bytes)
    UUID('00010203-0405-0607-0809-0a0b0c0d0e0f')
"""
| 46 | |
import os
import platform
import sys

from enum import Enum
| 52 | |
| 53 | |
__author__ = 'Ka-Ping Yee <ping@zesty.ca>'

# The recognized platforms - known behaviors
_AIX = platform.system() == 'AIX'
_DARWIN = platform.system() == 'Darwin'
_LINUX = platform.system() == 'Linux'
_WINDOWS = platform.system() == 'Windows'

# How MAC addresses appear in command output on this platform: AIX separates
# the groups with '.' and drops leading zeroes; everything else uses ':' and
# always prints two hex digits per group.
_MAC_DELIM = b'.' if _AIX else b':'
_MAC_OMITS_LEADING_ZEROES = _AIX

# The possible values of UUID.variant.
RESERVED_NCS = 'reserved for NCS compatibility'
RFC_4122 = 'specified in RFC 4122'
RESERVED_MICROSOFT = 'reserved for Microsoft compatibility'
RESERVED_FUTURE = 'reserved for future definition'

# Aliases for the built-in types, needed because UUID.__init__ has
# parameters named 'int' and 'bytes' that shadow the built-ins.
int_ = int      # The built-in int type
bytes_ = bytes  # The built-in bytes type
Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 74 | |
Barry Warsaw | 8c130d7 | 2017-02-18 15:45:49 -0500 | [diff] [blame] | 75 | |
class SafeUUID(Enum):
    """Whether a UUID was generated in a multiprocessing-safe way.

    This is the type of the UUID.is_safe attribute.  'unknown' is the value
    a UUID gets when nothing else is passed to its constructor.
    """
    safe = 0
    unsafe = -1
    unknown = None
| 80 | |
| 81 | |
class UUID:
    """Instances of the UUID class represent UUIDs as specified in RFC 4122.
    UUID objects are immutable, hashable, and usable as dictionary keys.
    Converting a UUID to a string with str() yields something in the form
    '12345678-1234-1234-1234-123456789abc'.  The UUID constructor accepts
    five possible forms: a similar string of hexadecimal digits, or a tuple
    of six integer fields (with 32-bit, 16-bit, 16-bit, 8-bit, 8-bit, and
    48-bit values respectively) as an argument named 'fields', or a string
    of 16 bytes (with all the integer fields in big-endian order) as an
    argument named 'bytes', or a string of 16 bytes (with the first three
    fields in little-endian order) as an argument named 'bytes_le', or a
    single 128-bit integer as an argument named 'int'.

    UUIDs have these read-only attributes:

        bytes       the UUID as a 16-byte string (containing the six
                    integer fields in big-endian byte order)

        bytes_le    the UUID as a 16-byte string (with time_low, time_mid,
                    and time_hi_version in little-endian byte order)

        fields      a tuple of the six integer fields of the UUID,
                    which are also available as six individual attributes
                    and two derived attributes:

            time_low                the first 32 bits of the UUID
            time_mid                the next 16 bits of the UUID
            time_hi_version         the next 16 bits of the UUID
            clock_seq_hi_variant    the next 8 bits of the UUID
            clock_seq_low           the next 8 bits of the UUID
            node                    the last 48 bits of the UUID

            time                    the 60-bit timestamp
            clock_seq               the 14-bit sequence number

        hex         the UUID as a 32-character hexadecimal string

        int         the UUID as a 128-bit integer

        urn         the UUID as a URN as specified in RFC 4122

        variant     the UUID variant (one of the constants RESERVED_NCS,
                    RFC_4122, RESERVED_MICROSOFT, or RESERVED_FUTURE)

        version     the UUID version number (1 through 5, meaningful only
                    when the variant is RFC_4122)

        is_safe     An enum indicating whether the UUID has been generated in
                    a way that is safe for multiprocessing applications, via
                    uuid_generate_time_safe(3).
    """

    __slots__ = ('int', 'is_safe', '__weakref__')

    def __init__(self, hex=None, bytes=None, bytes_le=None, fields=None,
                 int=None, version=None,
                 *, is_safe=SafeUUID.unknown):
        r"""Create a UUID from either a string of 32 hexadecimal digits,
        a string of 16 bytes as the 'bytes' argument, a string of 16 bytes
        in little-endian order as the 'bytes_le' argument, a tuple of six
        integers (32-bit time_low, 16-bit time_mid, 16-bit time_hi_version,
        8-bit clock_seq_hi_variant, 8-bit clock_seq_low, 48-bit node) as
        the 'fields' argument, or a single 128-bit integer as the 'int'
        argument.  When a string of hex digits is given, curly braces,
        hyphens, and a URN prefix are all optional.  For example, these
        expressions all yield the same UUID:

        UUID('{12345678-1234-5678-1234-567812345678}')
        UUID('12345678123456781234567812345678')
        UUID('urn:uuid:12345678-1234-5678-1234-567812345678')
        UUID(bytes=b'\x12\x34\x56\x78'*4)
        UUID(bytes_le=b'\x78\x56\x34\x12\x34\x12\x78\x56' +
                      b'\x12\x34\x56\x78\x12\x34\x56\x78')
        UUID(fields=(0x12345678, 0x1234, 0x5678, 0x12, 0x34, 0x567812345678))
        UUID(int=0x12345678123456781234567812345678)

        Exactly one of 'hex', 'bytes', 'bytes_le', 'fields', or 'int' must
        be given.  The 'version' argument is optional; if given, the resulting
        UUID will have its variant and version set according to RFC 4122,
        overriding the given 'hex', 'bytes', 'bytes_le', 'fields', or 'int'.

        is_safe is an enum exposed as an attribute on the instance.  It
        indicates whether the UUID has been generated in a way that is safe
        for multiprocessing applications, via uuid_generate_time_safe(3).

        Raises TypeError unless exactly one of the five value arguments is
        given, and ValueError when the given value is malformed or out of
        range or when 'version' is not between 1 and 5.
        """

        if [hex, bytes, bytes_le, fields, int].count(None) != 4:
            raise TypeError('one of the hex, bytes, bytes_le, fields, '
                            'or int arguments must be given')
        # Each accepted form is reduced step by step to 'int', which is then
        # range-checked once: bytes_le -> bytes -> int, hex -> int and
        # fields -> int.
        if hex is not None:
            hex = hex.replace('urn:', '').replace('uuid:', '')
            hex = hex.strip('{}').replace('-', '')
            if len(hex) != 32:
                raise ValueError('badly formed hexadecimal UUID string')
            int = int_(hex, 16)
        if bytes_le is not None:
            if len(bytes_le) != 16:
                raise ValueError('bytes_le is not a 16-char string')
            # Reverse the first three fields (4, 2 and 2 bytes) to obtain
            # the big-endian layout; the last 8 bytes are left as they are.
            bytes = (bytes_le[4-1::-1] + bytes_le[6-1:4-1:-1] +
                     bytes_le[8-1:6-1:-1] + bytes_le[8:])
        if bytes is not None:
            if len(bytes) != 16:
                raise ValueError('bytes is not a 16-char string')
            assert isinstance(bytes, bytes_), repr(bytes)
            int = int_.from_bytes(bytes, byteorder='big')
        if fields is not None:
            if len(fields) != 6:
                raise ValueError('fields is not a 6-tuple')
            (time_low, time_mid, time_hi_version,
             clock_seq_hi_variant, clock_seq_low, node) = fields
            if not 0 <= time_low < 1<<32:
                raise ValueError('field 1 out of range (need a 32-bit value)')
            if not 0 <= time_mid < 1<<16:
                raise ValueError('field 2 out of range (need a 16-bit value)')
            if not 0 <= time_hi_version < 1<<16:
                raise ValueError('field 3 out of range (need a 16-bit value)')
            if not 0 <= clock_seq_hi_variant < 1<<8:
                raise ValueError('field 4 out of range (need an 8-bit value)')
            if not 0 <= clock_seq_low < 1<<8:
                raise ValueError('field 5 out of range (need an 8-bit value)')
            if not 0 <= node < 1<<48:
                raise ValueError('field 6 out of range (need a 48-bit value)')
            clock_seq = (clock_seq_hi_variant << 8) | clock_seq_low
            int = ((time_low << 96) | (time_mid << 80) |
                   (time_hi_version << 64) | (clock_seq << 48) | node)
        if int is not None:
            if not 0 <= int < 1<<128:
                raise ValueError('int is out of range (need a 128-bit value)')
        if version is not None:
            if not 1 <= version <= 5:
                raise ValueError('illegal version number')
            # Set the variant to RFC 4122.
            int &= ~(0xc000 << 48)
            int |= 0x8000 << 48
            # Set the version number.
            int &= ~(0xf000 << 64)
            int |= version << 76
        # __setattr__ is overridden to enforce immutability, so the two
        # slots have to be filled through object.__setattr__.
        object.__setattr__(self, 'int', int)
        object.__setattr__(self, 'is_safe', is_safe)

    def __getstate__(self):
        d = {'int': self.int}
        if self.is_safe != SafeUUID.unknown:
            # is_safe is a SafeUUID instance.  Return just its value, so that
            # it can be un-pickled in older Python versions without SafeUUID.
            d['is_safe'] = self.is_safe.value
        return d

    def __setstate__(self, state):
        object.__setattr__(self, 'int', state['int'])
        # is_safe was added in 3.7; it is also omitted when it is "unknown"
        object.__setattr__(self, 'is_safe',
                           SafeUUID(state['is_safe'])
                           if 'is_safe' in state else SafeUUID.unknown)

    def __eq__(self, other):
        if isinstance(other, UUID):
            return self.int == other.int
        return NotImplemented

    # Q. What's the value of being able to sort UUIDs?
    # A. Use them as keys in a B-Tree or similar mapping.

    def __lt__(self, other):
        if isinstance(other, UUID):
            return self.int < other.int
        return NotImplemented

    def __gt__(self, other):
        if isinstance(other, UUID):
            return self.int > other.int
        return NotImplemented

    def __le__(self, other):
        if isinstance(other, UUID):
            return self.int <= other.int
        return NotImplemented

    def __ge__(self, other):
        if isinstance(other, UUID):
            return self.int >= other.int
        return NotImplemented

    def __hash__(self):
        return hash(self.int)

    def __int__(self):
        return self.int

    def __repr__(self):
        return '%s(%r)' % (self.__class__.__name__, str(self))

    def __setattr__(self, name, value):
        raise TypeError('UUID objects are immutable')

    def __str__(self):
        hex = '%032x' % self.int
        return '%s-%s-%s-%s-%s' % (
            hex[:8], hex[8:12], hex[12:16], hex[16:20], hex[20:])

    @property
    def bytes(self):
        return self.int.to_bytes(16, 'big')

    @property
    def bytes_le(self):
        bytes = self.bytes
        # Same byte shuffling as in __init__: reverse the first three fields.
        return (bytes[4-1::-1] + bytes[6-1:4-1:-1] + bytes[8-1:6-1:-1] +
                bytes[8:])

    @property
    def fields(self):
        return (self.time_low, self.time_mid, self.time_hi_version,
                self.clock_seq_hi_variant, self.clock_seq_low, self.node)

    @property
    def time_low(self):
        return self.int >> 96

    @property
    def time_mid(self):
        return (self.int >> 80) & 0xffff

    @property
    def time_hi_version(self):
        return (self.int >> 64) & 0xffff

    @property
    def clock_seq_hi_variant(self):
        return (self.int >> 56) & 0xff

    @property
    def clock_seq_low(self):
        return (self.int >> 48) & 0xff

    @property
    def time(self):
        # The top 4 bits of time_hi_version hold the version, not the time.
        return (((self.time_hi_version & 0x0fff) << 48) |
                (self.time_mid << 32) | self.time_low)

    @property
    def clock_seq(self):
        # The top 2 bits of clock_seq_hi_variant are masked off, leaving the
        # 14-bit sequence number.
        return (((self.clock_seq_hi_variant & 0x3f) << 8) |
                self.clock_seq_low)

    @property
    def node(self):
        return self.int & 0xffffffffffff

    @property
    def hex(self):
        return '%032x' % self.int

    @property
    def urn(self):
        return 'urn:uuid:' + str(self)

    @property
    def variant(self):
        # Test the top bits of clock_seq_hi_variant one at a time, from the
        # most significant down.
        if not self.int & (0x8000 << 48):
            return RESERVED_NCS
        elif not self.int & (0x4000 << 48):
            return RFC_4122
        elif not self.int & (0x2000 << 48):
            return RESERVED_MICROSOFT
        else:
            return RESERVED_FUTURE

    @property
    def version(self):
        # The version bits are only meaningful for RFC 4122 UUIDs; for any
        # other variant this falls through and returns None.
        if self.variant == RFC_4122:
            return int((self.int >> 76) & 0xf)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 355 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 356 | |
def _get_command_stdout(command, *args):
    """Run *command* with *args* and return its standard output.

    The executable is looked up on PATH with '/sbin' and '/usr/sbin'
    appended.  Empty-string arguments are dropped rather than passed on:
    callers use '' to mean "no arguments", and forwarding it would hand the
    program a real, empty argument.

    Returns an io.BytesIO holding the captured stdout, or None when the
    executable cannot be found or running it fails.
    """
    import io
    import os
    import shutil
    import subprocess

    try:
        path_dirs = os.environ.get('PATH', os.defpath).split(os.pathsep)
        path_dirs.extend(['/sbin', '/usr/sbin'])
        executable = shutil.which(command, path=os.pathsep.join(path_dirs))
        if executable is None:
            return None
        # LC_ALL=C to ensure English output, stderr=DEVNULL to prevent output
        # on stderr (Note: we don't have an example where the words we search
        # for are actually localized, but in theory some system could do so.)
        env = dict(os.environ)
        env['LC_ALL'] = 'C'
        argv = [executable]
        argv.extend(arg for arg in args if arg != '')
        with subprocess.Popen(argv,
                              stdout=subprocess.PIPE,
                              stderr=subprocess.DEVNULL,
                              env=env) as proc:
            stdout, _ = proc.communicate()
        return io.BytesIO(stdout)
    except (OSError, subprocess.SubprocessError):
        return None
| 381 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 382 | |
# For MAC (a.k.a. IEEE 802, or EUI-48) addresses, the second least significant
# bit of the first octet signifies whether the MAC address is universally (0)
# or locally (1) administered.  Network cards from hardware manufacturers will
# always be universally administered to guarantee global uniqueness of the MAC
# address, but any particular machine may have other interfaces which are
# locally administered.  An example of the latter is the bridge interface to
# the Touch Bar on MacBook Pros.
#
# This bit works out to be the 42nd bit counting from 1 being the least
# significant, or 1<<41.  We'll prefer universally administered MAC addresses
# over locally administered ones since the former are globally unique, but
# we'll return the first of the latter found if that's all the machine has.
#
# See https://en.wikipedia.org/wiki/MAC_address#Universal_vs._local

def _is_universal(mac):
    """Return True if the integer MAC address *mac* is universally
    administered, i.e. its 1<<41 bit is clear."""
    return not (mac & (1 << 41))
| 400 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 401 | |
def _find_mac_near_keyword(command, args, keywords, get_word_index):
    """Searches a command's output for a MAC address near a keyword.

    Each line of words in the output is case-insensitively searched for
    any of the given keywords.  Upon a match, get_word_index is invoked
    to pick a word from the line, given the index of the match.  For
    example, lambda i: 0 would get the first word on the line, while
    lambda i: i - 1 would get the word preceding the keyword.

    Returns the first universally administered MAC address found, else the
    first non-zero locally administered one, else None.  None is also
    returned when the command's output cannot be obtained.
    """
    stdout = _get_command_stdout(command, args)
    if stdout is None:
        return None

    first_local_mac = None
    for line in stdout:
        words = line.lower().rstrip().split()
        for i, candidate in enumerate(words):
            if candidate not in keywords:
                continue
            try:
                word = words[get_word_index(i)]
                mac = int(word.replace(_MAC_DELIM, b''), 16)
            except (ValueError, IndexError):
                # Virtual interfaces, such as those provided by
                # VPNs, do not have a colon-delimited MAC address
                # as expected, but a 16-byte HWAddr separated by
                # dashes.  These should be ignored in favor of a
                # real MAC address
                continue
            if _is_universal(mac):
                return mac
            first_local_mac = first_local_mac or mac
    return first_local_mac or None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 435 | |
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 436 | |
def _parse_mac(word):
    """Parse the bytes string *word* as a MAC address.

    Returns the address as an integer, or None when *word* is not six
    groups of hexadecimal digits separated by _MAC_DELIM.
    """
    # Accept 'HH:HH:HH:HH:HH:HH' MAC address (ex: '52:54:00:9d:0e:67'),
    # but reject IPv6 address (ex: 'fe80::5054:ff:fe9' or '123:2:3:4:5:6:7:8').
    #
    # Virtual interfaces, such as those provided by VPNs, do not have a
    # colon-delimited MAC address as expected, but a 16-byte HWAddr separated
    # by dashes.  These should be ignored in favor of a real MAC address
    parts = word.split(_MAC_DELIM)
    if len(parts) != 6:
        return None
    # int(x, 16) also accepts a sign, underscores and a '0x' prefix, so
    # groups such as b'0x' or b'-1' would otherwise be parsed as part of a
    # MAC.  Only hexadecimal digits are allowed here.
    hexdigits = b'0123456789abcdefABCDEF'
    if not all(byte in hexdigits for part in parts for byte in part):
        return None
    if _MAC_OMITS_LEADING_ZEROES:
        # (Only) on AIX the macaddr value given is not prefixed by 0, e.g.
        # en0   1500  link#2      fa.bc.de.f7.62.4    110854824     0 160133733     0     0
        # not
        # en0   1500  link#2      fa.bc.de.f7.62.04   110854824     0 160133733     0     0
        if not all(1 <= len(part) <= 2 for part in parts):
            return None
        hexstr = b''.join(part.rjust(2, b'0') for part in parts)
    else:
        if not all(len(part) == 2 for part in parts):
            return None
        hexstr = b''.join(parts)
    # hexstr is now exactly twelve hexadecimal digits, so this cannot fail.
    return int(hexstr, 16)
| 463 | |
| 464 | |
def _find_mac_under_heading(command, args, heading):
    """Looks for a MAC address under a heading in a command's output.

    The first line of words in the output is searched for the given
    heading.  Words at the same word index as the heading in subsequent
    lines are then examined to see if they look like MAC addresses.

    Returns the first universally administered MAC address found, else the
    first locally administered one, else None.  None is also returned when
    the command's output cannot be obtained or the heading is missing.
    """
    stdout = _get_command_stdout(command, args)
    if stdout is None:
        return None

    keywords = stdout.readline().rstrip().split()
    try:
        column_index = keywords.index(heading)
    except ValueError:
        return None

    first_local_mac = None
    for line in stdout:
        words = line.rstrip().split()
        try:
            word = words[column_index]
        except IndexError:
            # This line has fewer columns than the heading line.
            continue

        mac = _parse_mac(word)
        if mac is None:
            continue
        if _is_universal(mac):
            return mac
        if first_local_mac is None:
            first_local_mac = mac

    return first_local_mac
Michael Felt | 0bcbfa4 | 2019-09-26 20:43:15 +0100 | [diff] [blame] | 499 | |
| 500 | |
# The following functions call external programs to 'get' a macaddr value to
# be used as basis for an uuid
def _ifconfig_getnode():
    """Get the hardware address on Unix by running ifconfig.

    Returns the MAC address as an integer, or None if none was found.
    """
    # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes.
    keywords = (b'hwaddr', b'ether', b'address:', b'lladdr')
    for args in ('', '-a', '-av'):
        # The MAC address is the word right after the keyword.
        mac = _find_mac_near_keyword('ifconfig', args, keywords, lambda i: i+1)
        if mac:
            return mac
    return None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 512 | |
def _ip_getnode():
    """Get the hardware address on Unix by running ip.

    Returns the MAC address as an integer, or None if none was found.
    """
    # This works on Linux with iproute2.
    mac = _find_mac_near_keyword('ip', 'link', [b'link/ether'], lambda i: i+1)
    if mac:
        return mac
    return None
Serhiy Storchaka | ac4aa7b | 2014-11-30 20:39:04 +0200 | [diff] [blame] | 520 | |
def _arp_getnode():
    """Get the hardware address on Unix by running arp.

    The local host name is resolved to an IP address, and the output of
    'arp -an' is searched for that address using several column layouts.
    Returns None if the host name cannot be resolved or no layout matches.
    """
    import os, socket
    try:
        ip_addr = socket.gethostbyname(socket.gethostname())
    except OSError:
        return None

    bare_ip = os.fsencode(ip_addr)
    bracketed_ip = os.fsencode('(%s)' % ip_addr)
    # Each entry is (keywords, index function); they are tried in order.
    layouts = (
        # Try getting the MAC addr from arp based on our IP address (Solaris).
        ([bare_ip], lambda i: -1),
        # This works on OpenBSD
        ([bare_ip], lambda i: i+1),
        # This works on Linux, FreeBSD and NetBSD
        ([bracketed_ip], lambda i: i+2),
    )
    for keywords, get_word_index in layouts:
        found = _find_mac_near_keyword('arp', '-an', keywords, get_word_index)
        if found:
            return found
    # Return None instead of 0.
    return None
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 546 | |
def _lanscan_getnode():
    """Get the hardware address on Unix by running lanscan.

    Searches the output of 'lanscan -ai' for a line mentioning 'lan0' and
    returns whatever _find_mac_near_keyword() reports for word index 0.
    """
    # This might work on HP-UX.
    interface_names = [b'lan0']
    first_word = lambda i: 0
    return _find_mac_near_keyword('lanscan', '-ai', interface_names,
                                  first_word)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 551 | |
def _netstat_getnode():
    """Get the hardware address on Unix by running netstat.

    Delegates to _find_mac_under_heading() for the 'Address' column of
    'netstat -ian' and returns its result unchanged.
    """
    # This works on AIX and might work on Tru64 UNIX.
    column_heading = b'Address'
    return _find_mac_under_heading('netstat', '-ian', column_heading)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 556 | |
def _ipconfig_getnode():
    """[DEPRECATED] Get the hardware address on Windows.

    Kept only as an alias; the work is done by _windll_getnode().
    """
    # bpo-40501: UuidCreateSequential() is now the only supported approach
    node = _windll_getnode()
    return node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 561 | |
def _netbios_getnode():
    """[DEPRECATED] Get the hardware address on Windows.

    Kept only as an alias; the work is done by _windll_getnode().
    """
    # bpo-40501: UuidCreateSequential() is now the only supported approach
    node = _windll_getnode()
    return node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 566 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 567 | |
# Import optional C extension at toplevel, to help disabling it when testing
try:
    import _uuid
except ImportError:
    # No accelerator module available: every hook is disabled.
    _uuid = None
    _generate_time_safe = None
    _UuidCreate = None
    _has_uuid_generate_time_safe = None
else:
    # Either generator function may be absent from the extension module, so
    # both are looked up with a None fallback.
    _generate_time_safe = getattr(_uuid, "generate_time_safe", None)
    _UuidCreate = getattr(_uuid, "UuidCreate", None)
    _has_uuid_generate_time_safe = _uuid.has_uuid_generate_time_safe
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 579 | |
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 580 | |
def _load_system_functions():
    """[DEPRECATED] Platform-specific functions loaded at import time.

    This function does nothing and returns None.
    """
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 583 | |
| 584 | |
def _unix_getnode():
    """Get the hardware address on Unix using the _uuid extension module.

    Returns None when the extension's time-based generator is unavailable.
    """
    if not _generate_time_safe:
        return None
    # The second element of the result is not needed to extract the node.
    time_based_bytes, _ = _generate_time_safe()
    return UUID(bytes=time_based_bytes).node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 590 | |
def _windll_getnode():
    """Get the hardware address on Windows using the _uuid extension module.

    Returns None when the extension does not provide UuidCreate.
    """
    if not _UuidCreate:
        return None
    # The bytes from UuidCreate() are decoded via the bytes_le constructor.
    raw_le = _UuidCreate()
    return UUID(bytes_le=raw_le).node
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 596 | |
def _random_getnode():
    """Return a random 48-bit node ID with the multicast bit set."""
    # RFC 4122, $4.1.6 says "For systems with no IEEE address, a randomly or
    # pseudo-randomly generated value may be used; see Section 4.5.  The
    # multicast bit must be set in such addresses, in order that they will
    # never conflict with addresses obtained from network cards."
    #
    # The "multicast bit" of a MAC address is defined to be "the least
    # significant bit of the first octet".  This works out to be the 41st bit
    # counting from 1 being the least significant bit, or 1<<40.
    #
    # See https://en.wikipedia.org/wiki/MAC_address#Unicast_vs._multicast
    import random
    multicast_bit = 1 << 40
    random_bits = random.getrandbits(48)
    return random_bits | multicast_bit
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 611 | |
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 612 | |
# _OS_GETTERS, when known, are targeted for a specific OS or platform.
# The order is by 'common practice' on the specified platform.
# Note: on 'posix' and 'nt', _GETTERS starts with the getter backed by the
# _uuid extension module; when that one succeeds, none of the "external"
# program-based getters in _OS_GETTERS are called.
# _GETTERS is (also) used by test_uuid.py to SkipUnless(), e.g.,
#     @unittest.skipUnless(_uuid._ifconfig_getnode in _uuid._GETTERS, ...)
if _LINUX:
    _OS_GETTERS = [_ip_getnode, _ifconfig_getnode]
elif _DARWIN:
    _OS_GETTERS = [_ifconfig_getnode, _arp_getnode, _netstat_getnode]
elif _WINDOWS:
    # bpo-40501: _windll_getnode will always succeed, so these are not needed
    _OS_GETTERS = []
elif _AIX:
    _OS_GETTERS = [_netstat_getnode]
else:
    # Unknown platform: try every external program we know about.
    _OS_GETTERS = [
        _ifconfig_getnode,
        _ip_getnode,
        _arp_getnode,
        _netstat_getnode,
        _lanscan_getnode,
    ]

if os.name == 'posix':
    _GETTERS = [_unix_getnode, *_OS_GETTERS]
elif os.name == 'nt':
    _GETTERS = [_windll_getnode, *_OS_GETTERS]
else:
    _GETTERS = _OS_GETTERS
| 637 | |
_node = None

def getnode():
    """Get the hardware address as a 48-bit positive integer.

    The first time this runs, it may launch a separate program, which could
    be quite slow.  If all attempts to obtain the hardware address fail, we
    choose a random 48-bit number with the multicast bit (least significant
    bit of the first octet) set to 1 as recommended in RFC 4122.

    The first valid value is cached in the module-level _node, so later
    calls return it without running any getter again.
    """
    global _node
    if _node is not None:
        return _node

    candidate = None
    for getter in _GETTERS + [_random_getnode]:
        try:
            candidate = getter()
        except Exception:
            # Getters are best-effort: any ordinary failure means "try the
            # next one".  KeyboardInterrupt and SystemExit are deliberately
            # not swallowed, so a slow external program can be interrupted.
            continue
        if (candidate is not None) and (0 <= candidate < (1 << 48)):
            # Only a validated value is ever stored in the cache.
            _node = candidate
            return _node
    # Raised explicitly rather than via 'assert', so the check is not
    # stripped when Python runs with -O.
    raise AssertionError(
        '_random_getnode() returned invalid value: {}'.format(candidate))
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 660 | |
Antoine Pitrou | a106aec | 2017-09-28 23:03:06 +0200 | [diff] [blame] | 661 | |
_last_timestamp = None

def uuid1(node=None, clock_seq=None):
    """Generate a UUID from a host ID, sequence number, and the current time.

    If 'node' is not given, getnode() is used to obtain the hardware
    address.  If 'clock_seq' is given, it is used as the sequence number;
    otherwise a random 14-bit sequence number is chosen.
    """
    global _last_timestamp

    # When the system provides a version-1 UUID generator, use it (but don't
    # use UuidCreate here because its UUIDs don't conform to RFC 4122).
    if _generate_time_safe is not None and node is clock_seq is None:
        raw_bytes, safety_code = _generate_time_safe()
        try:
            safety = SafeUUID(safety_code)
        except ValueError:
            # A code that SafeUUID does not recognise.
            safety = SafeUUID.unknown
        return UUID(bytes=raw_bytes, is_safe=safety)

    import time
    # 0x01b21dd213814000 is the number of 100-ns intervals between the
    # UUID epoch 1582-10-15 00:00:00 and the Unix epoch 1970-01-01 00:00:00.
    ticks = time.time_ns() // 100 + 0x01b21dd213814000
    # Never hand out the same or an earlier timestamp twice in a row.
    if _last_timestamp is not None and ticks <= _last_timestamp:
        ticks = _last_timestamp + 1
    _last_timestamp = ticks

    if clock_seq is None:
        import random
        clock_seq = random.getrandbits(14)  # instead of stable storage

    # Split the timestamp and clock sequence into the UUID fields.
    time_low = ticks & 0xffffffff
    time_mid = (ticks >> 32) & 0xffff
    time_hi_version = (ticks >> 48) & 0x0fff
    clock_seq_low = clock_seq & 0xff
    clock_seq_hi_variant = (clock_seq >> 8) & 0x3f

    if node is None:
        node = getnode()
    uuid_fields = (time_low, time_mid, time_hi_version,
                   clock_seq_hi_variant, clock_seq_low, node)
    return UUID(fields=uuid_fields, version=1)
| 701 | |
def uuid3(namespace, name):
    """Generate a UUID from the MD5 hash of a namespace UUID and a name.

    'namespace' is a UUID object; its 16 raw bytes are prepended to the
    name before hashing.  'name' may be a str, which is encoded as UTF-8,
    or a bytes object, which is hashed as given.
    """
    from hashlib import md5
    if isinstance(name, str):
        name = bytes(name, "utf-8")
    # MD5 is used only to derive an identifier, not for security.
    digest = md5(
        namespace.bytes + name,
        usedforsecurity=False
    ).digest()
    return UUID(bytes=digest[:16], version=3)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 710 | |
def uuid4():
    """Generate a random UUID.

    The 16 bytes come from os.urandom(); the UUID is built with version=4.
    """
    random_bytes = os.urandom(16)
    return UUID(bytes=random_bytes, version=4)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 714 | |
def uuid5(namespace, name):
    """Generate a UUID from the SHA-1 hash of a namespace UUID and a name.

    'namespace' is a UUID object; its 16 raw bytes are prepended to the
    name before hashing.  'name' may be a str, which is encoded as UTF-8,
    or a bytes object, which is hashed as given.  Only the first 16 bytes
    of the SHA-1 digest are used.
    """
    from hashlib import sha1
    if isinstance(name, str):
        name = bytes(name, "utf-8")
    # SHA-1 is used only to derive an identifier, not for security; this
    # matches the flag uuid3() passes to md5.
    digest = sha1(
        namespace.bytes + name,
        usedforsecurity=False
    ).digest()
    return UUID(bytes=digest[:16], version=5)
Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 720 | |
# The following standard UUIDs are for use with uuid3() or uuid5().
# Each one is passed as the 'namespace' argument; the four values differ
# only in the last hex digit of the first group (0, 1, 2 and 4).

NAMESPACE_DNS = UUID('6ba7b810-9dad-11d1-80b4-00c04fd430c8')
NAMESPACE_URL = UUID('6ba7b811-9dad-11d1-80b4-00c04fd430c8')
NAMESPACE_OID = UUID('6ba7b812-9dad-11d1-80b4-00c04fd430c8')
NAMESPACE_X500 = UUID('6ba7b814-9dad-11d1-80b4-00c04fd430c8')