Blame - Python/pystrtod.c - platform/external/python/cpython3

2004-06-08 18:52:54 +0000

[diff] [blame]

1

/* -*- Mode: C; c-file-style: "python" -*- */

#include <Python.h>

#include <locale.h>

Mark Dickinson

2009-10-26 14:36:29 +0000

[diff] [blame]

6

/* Case-insensitive string match used for nan and inf detection; t should be

7

lower-case. Returns 1 for a successful match, 0 otherwise. */

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

8

9

static int

10

case_insensitive_match(const char *s, const char *t)

11

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

12

while(*t && Py_TOLOWER(*s) == *t) {

s++;

t++;

}

return *t ? 0 : 1;

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

17

}

18

Mark Dickinson

3b38df2

2009-10-26 14:36:29 +0000

[diff] [blame]

19

/* _Py_parse_inf_or_nan: Attempt to parse a string of the form "nan", "inf" or

20

"infinity", with an optional leading sign of "+" or "-". On success,

21

return the NaN or Infinity as a double and set *endptr to point just beyond

22

the successfully parsed portion of the string. On failure, return -1.0 and

23

set *endptr to point to the start of the string. */

24

Mark Dickinson

e383e82

2012-04-29 15:31:56 +0100

[diff] [blame]

25

#ifndef PY_NO_SHORT_FLOAT_REPR

26

27

double

28

_Py_parse_inf_or_nan(const char *p, char **endptr)

{

double retval;

const char *s;

int negate = 0;

s = p;

if (*s == '-') {

negate = 1;

s++;

}

else if (*s == '+') {

40

s++;

41

}

42

if (case_insensitive_match(s, "inf")) {

43

s += 3;

44

if (case_insensitive_match(s, "inity"))

45

s += 5;

46

retval = _Py_dg_infinity(negate);

47

}

48

else if (case_insensitive_match(s, "nan")) {

49

s += 3;

50

retval = _Py_dg_stdnan(negate);

}

else {

s = p;

retval = -1.0;

}

*endptr = (char *)s;

return retval;

}

#else

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

62

double

63

_Py_parse_inf_or_nan(const char *p, char **endptr)

64

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

65

double retval;

66

const char *s;

67

int negate = 0;

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

68

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

s = p;

if (*s == '-') {

negate = 1;

s++;

}

else if (*s == '+') {

75

s++;

76

}

77

if (case_insensitive_match(s, "inf")) {

78

s += 3;

79

if (case_insensitive_match(s, "inity"))

80

s += 5;

81

retval = negate ? -Py_HUGE_VAL : Py_HUGE_VAL;

82

}

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

83

#ifdef Py_NAN

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

84

else if (case_insensitive_match(s, "nan")) {

85

s += 3;

86

retval = negate ? -Py_NAN : Py_NAN;

87

}

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

88

#endif

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

else {

s = p;

retval = -1.0;

}

*endptr = (char *)s;

return retval;

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

95

}

96

Mark Dickinson

e383e82

2012-04-29 15:31:56 +0100

[diff] [blame]

97

#endif

98

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

99

/**

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

100

* _PyOS_ascii_strtod:

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

101

* @nptr: the string to convert to a numeric value.

102

* @endptr: if non-%NULL, it returns the character after

103

* the last character used in the conversion.

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

104

*

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

105

* Converts a string to a #gdouble value.

106

* This function behaves like the standard strtod() function

107

* does in the C locale. It does this without actually

108

* changing the current locale, since that would not be

109

* thread-safe.

110

*

111

* This function is typically used when reading configuration

112

* files or other non-user input that should be locale independent.

113

* To handle input from the user you should normally use the

114

* locale-sensitive system strtod() function.

115

*

116

* If the correct value would cause overflow, plus or minus %HUGE_VAL

117

* is returned (according to the sign of the value), and %ERANGE is

118

* stored in %errno. If the correct value would cause underflow,

119

* zero is returned and %ERANGE is stored in %errno.

Thomas Wouters

4d70c3d

2006-06-08 14:42:34 +0000

[diff] [blame]

120

* If memory allocation fails, %ENOMEM is stored in %errno.

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

121

*

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

122

* This function resets %errno before calling strtod() so that

123

* you can reliably detect overflow and underflow.

124

*

125

* Return value: the #gdouble value.

126

**/

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

127

128

#ifndef PY_NO_SHORT_FLOAT_REPR

129

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

130

static double

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

131

_PyOS_ascii_strtod(const char *nptr, char **endptr)

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

132

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

133

double result;

134

_Py_SET_53BIT_PRECISION_HEADER;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

135

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

136

assert(nptr != NULL);

137

/* Set errno to zero, so that we can distinguish zero results

138

and underflows */

139

errno = 0;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

140

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

141

_Py_SET_53BIT_PRECISION_START;

142

result = _Py_dg_strtod(nptr, endptr);

143

_Py_SET_53BIT_PRECISION_END;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

144

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

145

if (*endptr == nptr)

146

/* string might represent an inf or nan */

147

result = _Py_parse_inf_or_nan(nptr, endptr);

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

148

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

149

return result;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

}

#else

/*

Use system strtod; since strtod is locale aware, we may

157

have to first fix the decimal separator.

158

159

Note that unlike _Py_dg_strtod, the system strtod may not always give

160

correctly rounded results.

161

*/

162

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

163

static double

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

164

_PyOS_ascii_strtod(const char *nptr, char **endptr)

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

165

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

166

char *fail_pos;

Georg Brandl

6083a4b

2013-10-14 06:51:46 +0200

[diff] [blame]

167

double val;

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

168

struct lconv *locale_data;

169

const char *decimal_point;

170

size_t decimal_point_len;

171

const char *p, *decimal_point_pos;

172

const char *end = NULL; /* Silence gcc */

173

const char *digits_pos = NULL;

174

int negate = 0;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

175

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

176

assert(nptr != NULL);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

177

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

178

fail_pos = NULL;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

179

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

180

locale_data = localeconv();

181

decimal_point = locale_data->decimal_point;

182

decimal_point_len = strlen(decimal_point);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

183

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

184

assert(decimal_point_len != 0);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

185

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

186

decimal_point_pos = NULL;

Christian Heimes

faf2f63

2008-01-06 16:59:19 +0000

[diff] [blame]

187

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

188

/* Parse infinities and nans */

189

val = _Py_parse_inf_or_nan(nptr, endptr);

190

if (*endptr != nptr)

191

return val;

Mark Dickinson

2009-05-20 22:05:25 +0000

[diff] [blame]

192

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

193

/* Set errno to zero, so that we can distinguish zero results

194

and underflows */

195

errno = 0;

Mark Dickinson

2009-04-26 15:30:47 +0000

[diff] [blame]

196

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

197

/* We process the optional sign manually, then pass the remainder to

198

the system strtod. This ensures that the result of an underflow

199

has the correct sign. (bug #1725) */

200

p = nptr;

201

/* Process leading sign, if present */

if (*p == '-') {

negate = 1;

p++;

}

else if (*p == '+') {

207

p++;

208

}

Christian Heimes

faf2f63

2008-01-06 16:59:19 +0000

[diff] [blame]

209

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

210

/* Some platform strtods accept hex floats; Python shouldn't (at the

211

moment), so we check explicitly for strings starting with '0x'. */

212

if (*p == '0' && (*(p+1) == 'x' || *(p+1) == 'X'))

213

goto invalid_string;

Mark Dickinson

2009-04-26 15:30:47 +0000

[diff] [blame]

214

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

215

/* Check that what's left begins with a digit or decimal point */

216

if (!Py_ISDIGIT(*p) && *p != '.')

217

goto invalid_string;

Mark Dickinson

2009-04-26 15:30:47 +0000

[diff] [blame]

218

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

219

digits_pos = p;

220

if (decimal_point[0] != '.' ||

221

decimal_point[1] != 0)

222

{

223

/* Look for a '.' in the input; if present, it'll need to be

224

swapped for the current locale's decimal point before we

225

call strtod. On the other hand, if we find the current

226

locale's decimal point then the input is invalid. */

227

while (Py_ISDIGIT(*p))

228

p++;

Neal Norwitz

e7214a1

2005-12-18 05:03:17 +0000

[diff] [blame]

229

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

230

if (*p == '.')

231

{

232

decimal_point_pos = p++;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

233

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

234

/* locate end of number */

235

while (Py_ISDIGIT(*p))

236

p++;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

237

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

238

if (*p == 'e' || *p == 'E')

239

p++;

240

if (*p == '+' || *p == '-')

241

p++;

242

while (Py_ISDIGIT(*p))

p++;

end = p;

}

else if (strncmp(p, decimal_point, decimal_point_len) == 0)

247

/* Python bug #1417699 */

248

goto invalid_string;

249

/* For the other cases, we need not convert the decimal

250

point */

251

}

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

252

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

253

if (decimal_point_pos) {

254

char *copy, *c;

255

/* Create a copy of the input, with the '.' converted to the

256

locale-specific decimal point */

257

copy = (char *)PyMem_MALLOC(end - digits_pos +

258

1 + decimal_point_len);

259

if (copy == NULL) {

260

*endptr = (char *)nptr;

261

errno = ENOMEM;

262

return val;

263

}

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

264

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

265

c = copy;

266

memcpy(c, digits_pos, decimal_point_pos - digits_pos);

267

c += decimal_point_pos - digits_pos;

268

memcpy(c, decimal_point, decimal_point_len);

269

c += decimal_point_len;

270

memcpy(c, decimal_point_pos + 1,

271

end - (decimal_point_pos + 1));

272

c += end - (decimal_point_pos + 1);

273

*c = 0;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

274

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

275

val = strtod(copy, &fail_pos);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

276

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

277

if (fail_pos)

278

{

279

if (fail_pos > decimal_point_pos)

280

fail_pos = (char *)digits_pos +

281

(fail_pos - copy) -

282

(decimal_point_len - 1);

283

else

284

fail_pos = (char *)digits_pos +

285

(fail_pos - copy);

286

}

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

287

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

288

PyMem_FREE(copy);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

289

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

290

}

291

else {

292

val = strtod(digits_pos, &fail_pos);

293

}

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

294

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

295

if (fail_pos == digits_pos)

296

goto invalid_string;

Christian Heimes

faf2f63

2008-01-06 16:59:19 +0000

[diff] [blame]

297

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

298

if (negate && fail_pos != nptr)

299

val = -val;

300

*endptr = fail_pos;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

301

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

302

return val;

Mark Dickinson

2009-04-26 15:30:47 +0000

[diff] [blame]

303

304

invalid_string:

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

305

*endptr = (char*)nptr;

306

errno = EINVAL;

307

return -1.0;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

308

}

309

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

310

#endif

311

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

312

/* PyOS_string_to_double converts a null-terminated byte string s (interpreted

313

as a string of ASCII characters) to a float. The string should not have

314

leading or trailing whitespace. The conversion is independent of the

315

current locale.

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

316

317

If endptr is NULL, try to convert the whole string. Raise ValueError and

318

return -1.0 if the string is not a valid representation of a floating-point

319

number.

320

321

If endptr is non-NULL, try to convert as much of the string as possible.

322

If no initial segment of the string is the valid representation of a

323

floating-point number then *endptr is set to point to the beginning of the

324

string, -1.0 is returned and again ValueError is raised.

325

326

On overflow (e.g., when trying to convert '1e500' on an IEEE 754 machine),

327

if overflow_exception is NULL then +-Py_HUGE_VAL is returned, and no Python

Serhiy Storchaka

56a6d85

2014-12-01 18:28:43 +0200

[diff] [blame]

328

exception is raised. Otherwise, overflow_exception should point to

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

329

a Python exception, this exception will be raised, -1.0 will be returned,

330

and *endptr will point just past the end of the converted value.

331

332

If any other failure occurs (for example lack of memory), -1.0 is returned

333

and the appropriate Python exception will have been set.

*/

double

PyOS_string_to_double(const char *s,

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

338

char **endptr,

339

PyObject *overflow_exception)

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

340

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

341

double x, result=-1.0;

342

char *fail_pos;

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

343

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

344

errno = 0;

345

PyFPE_START_PROTECT("PyOS_string_to_double", return -1.0)

346

x = _PyOS_ascii_strtod(s, &fail_pos);

347

PyFPE_END_PROTECT(x)

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

348

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

349

if (errno == ENOMEM) {

350

PyErr_NoMemory();

351

fail_pos = (char *)s;

352

}

353

else if (!endptr && (fail_pos == s || *fail_pos != '\0'))

354

PyErr_Format(PyExc_ValueError,

355

"could not convert string to float: "

356

"%.200s", s);

357

else if (fail_pos == s)

358

PyErr_Format(PyExc_ValueError,

359

"could not convert string to float: "

360

"%.200s", s);

361

else if (errno == ERANGE && fabs(x) >= 1.0 && overflow_exception)

362

PyErr_Format(overflow_exception,

363

"value too large to convert to float: "

364

"%.200s", s);

365

else

366

result = x;

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

367

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

368

if (endptr != NULL)

369

*endptr = fail_pos;

370

return result;

Mark Dickinson

2009-05-03 20:33:40 +0000

[diff] [blame]

371

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

372

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

373

#ifdef PY_NO_SHORT_FLOAT_REPR

374

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

375

/* Given a string that may have a decimal point in the current

376

locale, change it back to a dot. Since the string cannot get

377

longer, no need for a maximum buffer size parameter. */

378

Py_LOCAL_INLINE(void)

379

change_decimal_from_locale_to_dot(char* buffer)

380

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

381

struct lconv *locale_data = localeconv();

382

const char *decimal_point = locale_data->decimal_point;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

383

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

384

if (decimal_point[0] != '.' || decimal_point[1] != 0) {

385

size_t decimal_point_len = strlen(decimal_point);

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

386

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

387

if (*buffer == '+' || *buffer == '-')

388

buffer++;

389

while (Py_ISDIGIT(*buffer))

390

buffer++;

391

if (strncmp(buffer, decimal_point, decimal_point_len) == 0) {

392

*buffer = '.';

393

buffer++;

394

if (decimal_point_len > 1) {

395

/* buffer needs to get smaller */

396

size_t rest_len = strlen(buffer +

397

(decimal_point_len - 1));

398

memmove(buffer,

399

buffer + (decimal_point_len - 1),

400

rest_len);

401

buffer[rest_len] = 0;

402

}

403

}

404

}

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

405

}

406

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

407

Christian Heimes

2008-02-22 16:37:40 +0000

[diff] [blame]

408

/* From the C99 standard, section 7.19.6:

409

The exponent always contains at least two digits, and only as many more digits

410

as necessary to represent the exponent.

411

*/

412

#define MIN_EXPONENT_DIGITS 2

413

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

414

/* Ensure that any exponent, if present, is at least MIN_EXPONENT_DIGITS

415

in length. */

416

Py_LOCAL_INLINE(void)

Mark Dickinson

ce95e56

2009-04-26 20:02:24 +0000

[diff] [blame]

417

ensure_minimum_exponent_length(char* buffer, size_t buf_size)

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

418

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

419

char *p = strpbrk(buffer, "eE");

420

if (p && (*(p + 1) == '-' || *(p + 1) == '+')) {

421

char *start = p + 2;

422

int exponent_digit_cnt = 0;

423

int leading_zero_cnt = 0;

424

int in_leading_zeros = 1;

425

int significant_digit_cnt;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

426

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

427

/* Skip over the exponent and the sign. */

428

p += 2;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

429

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

430

/* Find the end of the exponent, keeping track of leading

431

zeros. */

432

while (*p && Py_ISDIGIT(*p)) {

433

if (in_leading_zeros && *p == '0')

434

++leading_zero_cnt;

435

if (*p != '0')

436

in_leading_zeros = 0;

437

++p;

438

++exponent_digit_cnt;

439

}

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

440

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

441

significant_digit_cnt = exponent_digit_cnt - leading_zero_cnt;

442

if (exponent_digit_cnt == MIN_EXPONENT_DIGITS) {

443

/* If there are 2 exactly digits, we're done,

444

regardless of what they contain */

445

}

446

else if (exponent_digit_cnt > MIN_EXPONENT_DIGITS) {

447

int extra_zeros_cnt;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

448

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

449

/* There are more than 2 digits in the exponent. See

450

if we can delete some of the leading zeros */

451

if (significant_digit_cnt < MIN_EXPONENT_DIGITS)

452

significant_digit_cnt = MIN_EXPONENT_DIGITS;

453

extra_zeros_cnt = exponent_digit_cnt -

454

significant_digit_cnt;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

455

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

456

/* Delete extra_zeros_cnt worth of characters from the

457

front of the exponent */

458

assert(extra_zeros_cnt >= 0);

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

459

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

460

/* Add one to significant_digit_cnt to copy the

461

trailing 0 byte, thus setting the length */

462

memmove(start,

463

start + extra_zeros_cnt,

464

significant_digit_cnt + 1);

465

}

466

else {

467

/* If there are fewer than 2 digits, add zeros

468

until there are 2, if there's enough room */

469

int zeros = MIN_EXPONENT_DIGITS - exponent_digit_cnt;

470

if (start + zeros + exponent_digit_cnt + 1

471

< buffer + buf_size) {

472

memmove(start + zeros, start,

473

exponent_digit_cnt + 1);

474

memset(start, '0', zeros);

475

}

476

}

477

}

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

478

}

479

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

480

/* Remove trailing zeros after the decimal point from a numeric string; also

481

remove the decimal point if all digits following it are zero. The numeric

482

string must end in '\0', and should not have any leading or trailing

483

whitespace. Assumes that the decimal point is '.'. */

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

484

Py_LOCAL_INLINE(void)

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

485

remove_trailing_zeros(char *buffer)

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

486

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

487

char *old_fraction_end, *new_fraction_end, *end, *p;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

488

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

489

p = buffer;

490

if (*p == '-' || *p == '+')

491

/* Skip leading sign, if present */

492

++p;

493

while (Py_ISDIGIT(*p))

494

++p;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

495

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

496

/* if there's no decimal point there's nothing to do */

497

if (*p++ != '.')

498

return;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

499

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

500

/* scan any digits after the point */

501

while (Py_ISDIGIT(*p))

502

++p;

503

old_fraction_end = p;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

504

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

505

/* scan up to ending '\0' */

506

while (*p != '\0')

507

p++;

508

/* +1 to make sure that we move the null byte as well */

509

end = p+1;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

510

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

511

/* scan back from fraction_end, looking for removable zeros */

512

p = old_fraction_end;

513

while (*(p-1) == '0')

514

--p;

515

/* and remove point if we've got that far */

516

if (*(p-1) == '.')

517

--p;

518

new_fraction_end = p;

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

519

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

520

memmove(new_fraction_end, old_fraction_end, end-old_fraction_end);

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

521

}

522

523

/* Ensure that buffer has a decimal point in it. The decimal point will not

524

be in the current locale, it will always be '.'. Don't add a decimal point

525

if an exponent is present. Also, convert to exponential notation where

526

adding a '.0' would produce too many significant digits (see issue 5864).

527

528

Returns a pointer to the fixed buffer, or NULL on failure.

529

*/

530

Py_LOCAL_INLINE(char *)

531

ensure_decimal_point(char* buffer, size_t buf_size, int precision)

532

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

533

int digit_count, insert_count = 0, convert_to_exp = 0;

534

char *chars_to_insert, *digits_start;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

535

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

536

/* search for the first non-digit character */

537

char *p = buffer;

538

if (*p == '-' || *p == '+')

539

/* Skip leading sign, if present. I think this could only

540

ever be '-', but it can't hurt to check for both. */

541

++p;

542

digits_start = p;

543

while (*p && Py_ISDIGIT(*p))

544

++p;

545

digit_count = Py_SAFE_DOWNCAST(p - digits_start, Py_ssize_t, int);

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

546

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

547

if (*p == '.') {

548

if (Py_ISDIGIT(*(p+1))) {

549

/* Nothing to do, we already have a decimal

550

point and a digit after it */

551

}

552

else {

553

/* We have a decimal point, but no following

554

digit. Insert a zero after the decimal. */

555

/* can't ever get here via PyOS_double_to_string */

556

assert(precision == -1);

557

++p;

558

chars_to_insert = "0";

insert_count = 1;

}

}

else if (!(*p == 'e' || *p == 'E')) {

563

/* Don't add ".0" if we have an exponent. */

564

if (digit_count == precision) {

565

/* issue 5864: don't add a trailing .0 in the case

566

where the '%g'-formatted result already has as many

567

significant digits as were requested. Switch to

568

exponential notation instead. */

569

convert_to_exp = 1;

570

/* no exponent, no point, and we shouldn't land here

571

for infs and nans, so we must be at the end of the

string. */

assert(*p == '\0');

}

else {

assert(precision == -1 || digit_count < precision);

577

chars_to_insert = ".0";

insert_count = 2;

}

}

if (insert_count) {

size_t buf_len = strlen(buffer);

583

if (buf_len + insert_count + 1 >= buf_size) {

584

/* If there is not enough room in the buffer

585

for the additional text, just skip it. It's

586

not worth generating an error over. */

587

}

588

else {

589

memmove(p + insert_count, p,

590

buffer + strlen(buffer) - p + 1);

591

memcpy(p, chars_to_insert, insert_count);

592

}

593

}

594

if (convert_to_exp) {

int written;

size_t buf_avail;

p = digits_start;

/* insert decimal point */

599

assert(digit_count >= 1);

600

memmove(p+2, p+1, digit_count); /* safe, but overwrites nul */

601

p[1] = '.';

602

p += digit_count+1;

603

assert(p <= buf_size+buffer);

604

buf_avail = buf_size+buffer-p;

605

if (buf_avail == 0)

606

return NULL;

607

/* Add exponent. It's okay to use lower case 'e': we only

608

arrive here as a result of using the empty format code or

609

repr/str builtins and those never want an upper case 'E' */

610

written = PyOS_snprintf(p, buf_avail, "e%+.02d", digit_count-1);

611

if (!(0 <= written &&

612

written < Py_SAFE_DOWNCAST(buf_avail, size_t, int)))

613

/* output truncated, or something else bad happened */

614

return NULL;

615

remove_trailing_zeros(buffer);

616

}

617

return buffer;

Eric Smith

2008-04-30 02:12:09 +0000

[diff] [blame]

618

}

619

Christian Heimes

2008-02-22 16:37:40 +0000

[diff] [blame]

620

/* see FORMATBUFLEN in unicodeobject.c */

621

#define FLOAT_FORMATBUFLEN 120

622

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

623

/**

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

624

* _PyOS_ascii_formatd:

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

625

* @buffer: A buffer to place the resulting string in

Christian Heimes

2008-03-18 15:15:01 +0000

[diff] [blame]

626

* @buf_size: The length of the buffer.

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

627

* @format: The printf()-style format to use for the

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

628

* code to use for converting.

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

629

* @d: The #gdouble to convert

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

630

* @precision: The precision to use when formatting.

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

631

*

632

* Converts a #gdouble to a string, using the '.' as

633

* decimal point. To format the number you pass in

634

* a printf()-style format string. Allowed conversion

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

635

* specifiers are 'e', 'E', 'f', 'F', 'g', 'G', and 'Z'.

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

636

*

Christian Heimes

2008-03-18 15:15:01 +0000

[diff] [blame]

637

* 'Z' is the same as 'g', except it always has a decimal and

638

* at least one digit after the decimal.

Christian Heimes

2008-02-22 16:37:40 +0000

[diff] [blame]

639

*

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

640

* Return value: The pointer to the buffer with the converted string.

Mark Dickinson

2009-04-29 18:47:07 +0000

[diff] [blame]

641

* On failure returns NULL but does not set any Python exception.

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

642

**/

Eric Smith

2010-02-22 14:58:30 +0000

[diff] [blame]

643

static char *

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

644

_PyOS_ascii_formatd(char *buffer,

size_t buf_size,

const char *format,

double d,

int precision)

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

649

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

650

char format_char;

651

size_t format_len = strlen(format);

Christian Heimes

2008-02-22 16:37:40 +0000

[diff] [blame]

652

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

653

/* Issue 2264: code 'Z' requires copying the format. 'Z' is 'g', but

654

also with at least one character past the decimal. */

655

char tmp_format[FLOAT_FORMATBUFLEN];

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

656

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

657

/* The last character in the format string must be the format char */

658

format_char = format[format_len - 1];

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

659

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

660

if (format[0] != '%')

661

return NULL;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

662

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

663

/* I'm not sure why this test is here. It's ensuring that the format

664

string after the first character doesn't have a single quote, a

665

lowercase l, or a percent. This is the reverse of the commented-out

666

test about 10 lines ago. */

667

if (strpbrk(format + 1, "'l%"))

668

return NULL;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

669

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

670

/* Also curious about this function is that it accepts format strings

671

like "%xg", which are invalid for floats. In general, the

672

interface to this function is not very good, but changing it is

673

difficult because it's a public API. */

Christian Heimes

2008-03-18 15:15:01 +0000

[diff] [blame]

674

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

675

if (!(format_char == 'e' || format_char == 'E' ||

676

format_char == 'f' || format_char == 'F' ||

677

format_char == 'g' || format_char == 'G' ||

678

format_char == 'Z'))

679

return NULL;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

680

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

681

/* Map 'Z' format_char to 'g', by copying the format string and

682

replacing the final char with a 'g' */

683

if (format_char == 'Z') {

684

if (format_len + 1 >= sizeof(tmp_format)) {

685

/* The format won't fit in our copy. Error out. In

686

practice, this will never happen and will be

687

detected by returning NULL */

688

return NULL;

689

}

690

strcpy(tmp_format, format);

691

tmp_format[format_len - 1] = 'g';

692

format = tmp_format;

693

}

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

694

Christian Heimes

2008-03-18 15:15:01 +0000

[diff] [blame]

695

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

696

/* Have PyOS_snprintf do the hard work */

697

PyOS_snprintf(buffer, buf_size, format, d);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

698

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

699

/* Do various fixups on the return string */

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

700

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

701

/* Get the current locale, and find the decimal point string.

702

Convert that string back to a dot. */

703

change_decimal_from_locale_to_dot(buffer);

Christian Heimes

2008-02-22 16:37:40 +0000

[diff] [blame]

704

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

705

/* If an exponent exists, ensure that the exponent is at least

706

MIN_EXPONENT_DIGITS digits, providing the buffer is large enough

707

for the extra zeros. Also, if there are more than

708

MIN_EXPONENT_DIGITS, remove as many zeros as possible until we get

709

back to MIN_EXPONENT_DIGITS */

710

ensure_minimum_exponent_length(buffer, buf_size);

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

711

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

712

/* If format_char is 'Z', make sure we have at least one character

713

after the decimal point (and make sure we have a decimal point);

714

also switch to exponential notation in some edge cases where the

715

extra character would produce more significant digits that we

716

really want. */

717

if (format_char == 'Z')

718

buffer = ensure_decimal_point(buffer, buf_size, precision);

Christian Heimes

2008-03-18 15:15:01 +0000

[diff] [blame]

719

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

720

return buffer;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

721

}

722

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

723

/* The fallback code to use if _Py_dg_dtoa is not available. */

724

725

PyAPI_FUNC(char *) PyOS_double_to_string(double val,

char format_code,

int precision,

int flags,

int *type)

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

730

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

char format[32];

Py_ssize_t bufsize;

char *buf;

int t, exp;

int upper = 0;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

736

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

737

/* Validate format_code, and map upper and lower case */

738

switch (format_code) {

739

case 'e': /* exponent */

740

case 'f': /* fixed */

741

case 'g': /* general */

break;

case 'E':

upper = 1;

format_code = 'e';

break;

case 'F':

upper = 1;

format_code = 'f';

break;

case 'G':

upper = 1;

format_code = 'g';

break;

case 'r': /* repr format */

756

/* Supplied precision is unused, must be 0. */

757

if (precision != 0) {

758

PyErr_BadInternalCall();

759

return NULL;

760

}

761

/* The repr() precision (17 significant decimal digits) is the

762

minimal number that is guaranteed to have enough precision

763

so that if the number is read back in the exact same binary

764

value is recreated. This is true for IEEE floating point

765

by design, and also happens to work for all other modern

hardware. */

precision = 17;

format_code = 'g';

break;

default:

PyErr_BadInternalCall();

772

return NULL;

773

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

774

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

775

/* Here's a quick-and-dirty calculation to figure out how big a buffer

776

we need. In general, for a finite float we need:

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

777

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

778

1 byte for each digit of the decimal significand, and

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

779

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

780

1 for a possible sign

781

1 for a possible decimal point

782

2 for a possible [eE][+-]

783

1 for each digit of the exponent; if we allow 19 digits

784

total then we're safe up to exponents of 2**63.

785

1 for the trailing nul byte

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

786

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

787

This gives a total of 24 + the number of digits in the significand,

788

and the number of digits in the significand is:

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

789

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

790

for 'g' format: at most precision, except possibly

791

when precision == 0, when it's 1.

792

for 'e' format: precision+1

793

for 'f' format: precision digits after the point, at least 1

794

before. To figure out how many digits appear before the point

795

we have to examine the size of the number. If fabs(val) < 1.0

796

then there will be only one digit before the point. If

797

fabs(val) >= 1.0, then there are at most

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

798

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

799

1+floor(log10(ceiling(fabs(val))))

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

800

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

801

digits before the point (where the 'ceiling' allows for the

802

possibility that the rounding rounds the integer part of val

803

up). A safe upper bound for the above quantity is

804

1+floor(exp/3), where exp is the unique integer such that 0.5

805

<= fabs(val)/2**exp < 1.0. This exp can be obtained from

806

frexp.

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

807

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

808

So we allow room for precision+1 digits for all formats, plus an

809

extra floor(exp/3) digits for 'f' format.

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

810

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

811

*/

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

812

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

813

if (Py_IS_NAN(val) || Py_IS_INFINITY(val))

814

/* 3 for 'inf'/'nan', 1 for sign, 1 for '\0' */

815

bufsize = 5;

816

else {

817

bufsize = 25 + precision;

818

if (format_code == 'f' && fabs(val) >= 1.0) {

frexp(val, &exp);

bufsize += exp/3;

}

}

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

823

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

824

buf = PyMem_Malloc(bufsize);

if (buf == NULL) {

PyErr_NoMemory();

return NULL;

}

Mark Dickinson

2009-05-01 11:42:00 +0000

[diff] [blame]

829

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

830

/* Handle nan and inf. */

831

if (Py_IS_NAN(val)) {

832

strcpy(buf, "nan");

833

t = Py_DTST_NAN;

834

} else if (Py_IS_INFINITY(val)) {

835

if (copysign(1., val) == 1.)

strcpy(buf, "inf");

else

strcpy(buf, "-inf");

t = Py_DTST_INFINITE;

840

} else {

841

t = Py_DTST_FINITE;

842

if (flags & Py_DTSF_ADD_DOT_0)

843

format_code = 'Z';

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

844

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

845

PyOS_snprintf(format, sizeof(format), "%%%s.%i%c",

846

(flags & Py_DTSF_ALT ? "#" : ""), precision,

847

format_code);

848

_PyOS_ascii_formatd(buf, bufsize, format, val, precision);

849

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

850

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

851

/* Add sign when requested. It's convenient (esp. when formatting

852

complex numbers) to include a sign even for inf and nan. */

853

if (flags & Py_DTSF_SIGN && buf[0] != '-') {

854

size_t len = strlen(buf);

855

/* the bufsize calculations above should ensure that we've got

856

space to add a sign */

857

assert((size_t)bufsize >= len+2);

858

memmove(buf+1, buf, len+1);

buf[0] = '+';

}

if (upper) {

/* Convert to upper case. */

863

char *p1;

864

for (p1 = buf; *p1; p1++)

865

*p1 = Py_TOUPPER(*p1);

866

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

867

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

868

if (type)

869

*type = t;

870

return buf;

Martin v. Löwis

2004-06-08 18:52:54 +0000

[diff] [blame]

871

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

#else

/* _Py_dg_dtoa is available. */

876

877

/* I'm using a lookup table here so that I don't have to invent a non-locale

878

specific way to convert to uppercase */

#define OFS_INF 0

#define OFS_NAN 1

#define OFS_E 2

/* The lengths of these are known to the code below, so don't change them */

884

static char *lc_float_strings[] = {

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

885

"inf",

886

"nan",

887

"e",

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

888

};

889

static char *uc_float_strings[] = {

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

890

"INF",

891

"NAN",

892

"E",

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

};

/* Convert a double d to a string, and return a PyMem_Malloc'd block of

897

memory contain the resulting string.

898

899

Arguments:

900

d is the double to be converted

Eric Smith

2009-05-05 14:04:18 +0000

[diff] [blame]

901

format_code is one of 'e', 'f', 'g', 'r'. 'e', 'f' and 'g'

902

correspond to '%e', '%f' and '%g'; 'r' corresponds to repr.

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

903

mode is one of '0', '2' or '3', and is completely determined by

Eric Smith

2009-05-05 14:04:18 +0000

[diff] [blame]

904

format_code: 'e' and 'g' use mode 2; 'f' mode 3, 'r' mode 0.

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

905

precision is the desired precision

906

always_add_sign is nonzero if a '+' sign should be included for positive

907

numbers

908

add_dot_0_if_integer is nonzero if integers in non-exponential form

Eric Smith

2009-05-05 14:04:18 +0000

[diff] [blame]

909

should have ".0" added. Only applies to format codes 'r' and 'g'.

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

910

use_alt_formatting is nonzero if alternative formatting should be

Eric Smith

2009-05-05 14:04:18 +0000

[diff] [blame]

911

used. Only applies to format codes 'e', 'f' and 'g'. For code 'g',

912

at most one of use_alt_formatting and add_dot_0_if_integer should

913

be nonzero.

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

914

type, if non-NULL, will be set to one of these constants to identify

915

the type of the 'd' argument:

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

916

Py_DTST_FINITE

917

Py_DTST_INFINITE

918

Py_DTST_NAN

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

919

920

Returns a PyMem_Malloc'd block of memory containing the resulting string,

921

or NULL on error. If NULL is returned, the Python error has been set.

*/

static char *

format_float_short(double d, char format_code,

Victor Stinner

7b25135

2013-06-24 23:37:40 +0200

[diff] [blame]

926

int mode, int precision,

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

927

int always_add_sign, int add_dot_0_if_integer,

928

int use_alt_formatting, char **float_strings, int *type)

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

929

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

930

char *buf = NULL;

931

char *p = NULL;

932

Py_ssize_t bufsize = 0;

933

char *digits, *digits_end;

934

int decpt_as_int, sign, exp_len, exp = 0, use_exp = 0;

935

Py_ssize_t decpt, digits_len, vdigits_start, vdigits_end;

936

_Py_SET_53BIT_PRECISION_HEADER;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

937

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

938

/* _Py_dg_dtoa returns a digit string (no decimal point or exponent).

939

Must be matched by a call to _Py_dg_freedtoa. */

940

_Py_SET_53BIT_PRECISION_START;

941

digits = _Py_dg_dtoa(d, mode, precision, &decpt_as_int, &sign,

942

&digits_end);

943

_Py_SET_53BIT_PRECISION_END;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

944

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

945

decpt = (Py_ssize_t)decpt_as_int;

946

if (digits == NULL) {

947

/* The only failure mode is no memory. */

PyErr_NoMemory();

goto exit;

}

assert(digits_end != NULL && digits_end >= digits);

952

digits_len = digits_end - digits;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

953

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

954

if (digits_len && !Py_ISDIGIT(digits[0])) {

955

/* Infinities and nans here; adapt Gay's output,

956

so convert Infinity to inf and NaN to nan, and

957

ignore sign of nan. Then return. */

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

958

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

959

/* ignore the actual sign of a nan */

960

if (digits[0] == 'n' || digits[0] == 'N')

961

sign = 0;

Mark Dickinson

ad476da

2009-04-23 19:14:16 +0000

[diff] [blame]

962

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

963

/* We only need 5 bytes to hold the result "+inf\0" . */

964

bufsize = 5; /* Used later in an assert. */

965

buf = (char *)PyMem_Malloc(bufsize);

if (buf == NULL) {

PyErr_NoMemory();

goto exit;

}

p = buf;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

971

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

if (sign == 1) {

*p++ = '-';

}

else if (always_add_sign) {

976

*p++ = '+';

977

}

978

if (digits[0] == 'i' || digits[0] == 'I') {

979

strncpy(p, float_strings[OFS_INF], 3);

980

p += 3;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

981

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

982

if (type)

983

*type = Py_DTST_INFINITE;

984

}

985

else if (digits[0] == 'n' || digits[0] == 'N') {

986

strncpy(p, float_strings[OFS_NAN], 3);

987

p += 3;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

988

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

if (type)

*type = Py_DTST_NAN;

}

else {

/* shouldn't get here: Gay's code should always return

994

something starting with a digit, an 'I', or 'N' */

995

strncpy(p, "ERR", 3);

Brett Cannon

b94767f

2011-02-22 20:15:44 +0000

[diff] [blame]

996

/* p += 3; */

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

assert(0);

}

goto exit;

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1001

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1002

/* The result must be finite (not inf or nan). */

1003

if (type)

1004

*type = Py_DTST_FINITE;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1005

1006

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1007

/* We got digits back, format them. We may need to pad 'digits'

1008

either on the left or right (or both) with extra zeros, so in

1009

general the resulting string has the form

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1010

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1011

[<sign>]<zeros><digits><zeros>[<exponent>]

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1012

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1013

where either of the <zeros> pieces could be empty, and there's a

1014

decimal point that could appear either in <digits> or in the

1015

leading or trailing <zeros>.

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1016

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1017

Imagine an infinite 'virtual' string vdigits, consisting of the

1018

string 'digits' (starting at index 0) padded on both the left and

1019

right with infinite strings of zeros. We want to output a slice

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1020

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1021

vdigits[vdigits_start : vdigits_end]

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1022

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1023

of this virtual string. Thus if vdigits_start < 0 then we'll end

1024

up producing some leading zeros; if vdigits_end > digits_len there

1025

will be trailing zeros in the output. The next section of code

1026

determines whether to use an exponent or not, figures out the

1027

position 'decpt' of the decimal point, and computes 'vdigits_start'

1028

and 'vdigits_end'. */

1029

vdigits_end = digits_len;

1030

switch (format_code) {

1031

case 'e':

1032

use_exp = 1;

1033

vdigits_end = precision;

1034

break;

1035

case 'f':

1036

vdigits_end = decpt + precision;

1037

break;

1038

case 'g':

1039

if (decpt <= -4 || decpt >

1040

(add_dot_0_if_integer ? precision-1 : precision))

1041

use_exp = 1;

1042

if (use_alt_formatting)

1043

vdigits_end = precision;

1044

break;

1045

case 'r':

1046

/* convert to exponential format at 1e16. We used to convert

1047

at 1e17, but that gives odd-looking results for some values

1048

when a 16-digit 'shortest' repr is padded with bogus zeros.

1049

For example, repr(2e16+8) would give 20000000000000010.0;

1050

the true value is 20000000000000008.0. */

1051

if (decpt <= -4 || decpt > 16)

use_exp = 1;

break;

default:

PyErr_BadInternalCall();

1056

goto exit;

1057

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1058

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1059

/* if using an exponent, reset decimal point position to 1 and adjust

1060

exponent accordingly.*/

1061

if (use_exp) {

Victor Stinner

7b25135

2013-06-24 23:37:40 +0200

[diff] [blame]

1062

exp = (int)decpt - 1;

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1063

decpt = 1;

1064

}

1065

/* ensure vdigits_start < decpt <= vdigits_end, or vdigits_start <

1066

decpt < vdigits_end if add_dot_0_if_integer and no exponent */

1067

vdigits_start = decpt <= 0 ? decpt-1 : 0;

1068

if (!use_exp && add_dot_0_if_integer)

1069

vdigits_end = vdigits_end > decpt ? vdigits_end : decpt + 1;

1070

else

1071

vdigits_end = vdigits_end > decpt ? vdigits_end : decpt;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1072

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1073

/* double check inequalities */

1074

assert(vdigits_start <= 0 &&

1075

0 <= digits_len &&

1076

digits_len <= vdigits_end);

1077

/* decimal point should be in (vdigits_start, vdigits_end] */

1078

assert(vdigits_start < decpt && decpt <= vdigits_end);

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1079

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1080

/* Compute an upper bound how much memory we need. This might be a few

1081

chars too long, but no big deal. */

1082

bufsize =

1083

/* sign, decimal point and trailing 0 byte */

1084

3 +

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1085

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1086

/* total digit count (including zero padding on both sides) */

1087

(vdigits_end - vdigits_start) +

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1088

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1089

/* exponent "e+100", max 3 numerical digits */

1090

(use_exp ? 5 : 0);

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1091

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1092

/* Now allocate the memory and initialize p to point to the start of

1093

it. */

1094

buf = (char *)PyMem_Malloc(bufsize);

if (buf == NULL) {

PyErr_NoMemory();

goto exit;

}

p = buf;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1100

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1101

/* Add a negative sign if negative, and a plus sign if non-negative

1102

and always_add_sign is true. */

1103

if (sign == 1)

1104

*p++ = '-';

1105

else if (always_add_sign)

1106

*p++ = '+';

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1107

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1108

/* note that exactly one of the three 'if' conditions is true,

1109

so we include exactly one decimal point */

1110

/* Zero padding on left of digit string */

1111

if (decpt <= 0) {

1112

memset(p, '0', decpt-vdigits_start);

1113

p += decpt - vdigits_start;

1114

*p++ = '.';

1115

memset(p, '0', 0-decpt);

p += 0-decpt;

}

else {

memset(p, '0', 0-vdigits_start);

1120

p += 0 - vdigits_start;

1121

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1122

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1123

/* Digits, with included decimal point */

1124

if (0 < decpt && decpt <= digits_len) {

1125

strncpy(p, digits, decpt-0);

1126

p += decpt-0;

1127

*p++ = '.';

1128

strncpy(p, digits+decpt, digits_len-decpt);

1129

p += digits_len-decpt;

1130

}

1131

else {

1132

strncpy(p, digits, digits_len);

1133

p += digits_len;

1134

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1135

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1136

/* And zeros on the right */

1137

if (digits_len < decpt) {

1138

memset(p, '0', decpt-digits_len);

1139

p += decpt-digits_len;

1140

*p++ = '.';

1141

memset(p, '0', vdigits_end-decpt);

1142

p += vdigits_end-decpt;

1143

}

1144

else {

1145

memset(p, '0', vdigits_end-digits_len);

1146

p += vdigits_end-digits_len;

1147

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1148

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1149

/* Delete a trailing decimal pt unless using alternative formatting. */

1150

if (p[-1] == '.' && !use_alt_formatting)

1151

p--;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1152

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1153

/* Now that we've done zero padding, add an exponent if needed. */

1154

if (use_exp) {

1155

*p++ = float_strings[OFS_E][0];

1156

exp_len = sprintf(p, "%+.02d", exp);

1157

p += exp_len;

1158

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1159

exit:

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1160

if (buf) {

1161

*p = '\0';

1162

/* It's too late if this fails, as we've already stepped on

1163

memory that isn't ours. But it's an okay debugging test. */

1164

assert(p-buf < bufsize);

1165

}

1166

if (digits)

1167

_Py_dg_freedtoa(digits);

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1168

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1169

return buf;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

}

PyAPI_FUNC(char *) PyOS_double_to_string(double val,

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

char format_code,

int precision,

int flags,

int *type)

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1178

{

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1179

char **float_strings = lc_float_strings;

1180

int mode;

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1181

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1182

/* Validate format_code, and map upper and lower case. Compute the

1183

mode and make any adjustments as needed. */

1184

switch (format_code) {

1185

/* exponent */

1186

case 'E':

1187

float_strings = uc_float_strings;

format_code = 'e';

/* Fall through. */

case 'e':

mode = 2;

precision++;

break;

Eric Smith

2009-04-16 22:08:31 +0000

[diff] [blame]

1194

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1195

/* fixed */

1196

case 'F':

1197

float_strings = uc_float_strings;

format_code = 'f';

/* Fall through. */

case 'f':

mode = 3;

break;

Eric Smith

2009-04-16 22:08:31 +0000

[diff] [blame]

1203

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1204

/* general */

1205

case 'G':

1206

float_strings = uc_float_strings;

format_code = 'g';

/* Fall through. */

case 'g':

mode = 2;

/* precision 0 makes no sense for 'g' format; interpret as 1 */

1212

if (precision == 0)

1213

precision = 1;

1214

break;

Eric Smith

2009-04-16 22:08:31 +0000

[diff] [blame]

1215

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

/* repr format */

case 'r':

mode = 0;

/* Supplied precision is unused, must be 0. */

1220

if (precision != 0) {

1221

PyErr_BadInternalCall();

1222

return NULL;

1223

}

1224

break;

Eric Smith

2009-04-16 22:08:31 +0000

[diff] [blame]

1225

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1226

default:

1227

PyErr_BadInternalCall();

1228

return NULL;

1229

}

Eric Smith

2009-04-16 20:16:10 +0000

[diff] [blame]

1230

Antoine Pitrou

2010-05-09 15:52:27 +0000

[diff] [blame]

1231

return format_float_short(val, format_code, mode, precision,

1232

flags & Py_DTSF_SIGN,

1233

flags & Py_DTSF_ADD_DOT_0,

1234

flags & Py_DTSF_ALT,

1235

float_strings, type);

Eric Smith