pythonVSCode/pythonFiles/PythonTools/visualstudio_py_util.py at master · rmagee/pythonVSCode

History

625 lines (526 loc) · 22.2 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

329

330

331

332

333

334

335

336

337

338

339

340

341

342

343

344

345

346

347

348

349

350

351

352

353

354

355

356

357

358

359

360

361

362

363

364

365

366

367

368

369

370

371

372

373

374

375

376

377

378

379

380

381

382

383

384

385

386

387

388

389

390

391

392

393

394

395

396

397

398

399

400

401

402

403

404

405

406

407

408

409

410

411

412

413

414

415

416

417

418

419

420

421

422

423

424

425

426

427

428

429

430

431

432

433

434

435

436

437

438

439

440

441

442

443

444

445

446

447

448

449

450

451

452

453

454

455

456

457

458

459

460

461

462

463

464

465

466

467

468

469

470

471

472

473

474

475

476

477

478

479

480

481

482

483

484

485

486

487

488

489

490

491

492

493

494

495

496

497

498

499

500

501

502

503

504

505

506

507

508

509

510

511

512

513

514

515

516

517

518

519

520

521

522

523

524

525

526

527

528

529

530

531

532

533

534

535

536

537

538

539

540

541

542

543

544

545

546

547

548

549

550

551

552

553

554

555

556

557

558

559

560

561

562

563

564

565

566

567

568

569

570

571

572

573

574

575

576

577

578

579

580

581

582

583

584

585

586

587

588

589

590

591

592

593

594

595

596

597

598

599

600

601

602

603

604

605

606

607

608

609

610

611

612

613

614

615

616

617

618

619

620

621

622

623

624

625

# Python Tools for Visual Studio

# Copyright(c) Microsoft Corporation

# Licensed under the Apache License, Version 2.0 (the License); you may not use

# this file except in compliance with the License. You may obtain a copy of the

# License at http://www.apache.org/licenses/LICENSE-2.0

# THIS CODE IS PROVIDED ON AN *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS

# OF ANY KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY

# IMPLIED WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,

# MERCHANTABLITY OR NON-INFRINGEMENT.

# See the Apache Version 2.0 License for specific language governing

# permissions and limitations under the License.

__author__ = "Microsoft Corporation <[email protected]>"

__version__ = "3.0.0.0"

# This module MUST NOT import threading in global scope. This is because in a direct (non-ptvsd)

# attach scenario, it is loaded on the injected debugger attach thread, and if threading module

# hasn't been loaded already, it will assume that the thread on which it is being loaded is the

# main thread. This will cause issues when the thread goes away after attach completes.

import imp

import os

import sys

import struct

# Import encodings early to avoid import on the debugger thread, which may cause deadlock

from encodings import utf_8, ascii

# WARNING: Avoid imports beyond this point, specifically on the debugger thread, as this may cause

# deadlock where the debugger thread performs an import while a user thread has the import lock

# Py3k compat - alias unicode to str, and xrange to range

try:

unicode

except:

unicode = str

try:

xrange

except:

xrange = range

if sys.version_info[0] >= 3:

def to_bytes(cmd_str):

return ascii.Codec.encode(cmd_str)[0]

else:

def to_bytes(cmd_str):

return cmd_str

def exec_code(code, file, global_variables):

'''Executes the provided code as if it were the original script provided

to python.exe. The functionality is similar to `runpy.run_path`, which was

added in Python 2.7/3.2.

The following values in `global_variables` will be set to the following

values, if they are not already set::

__name__ = '<run_path>'

__file__ = file

__package__ = __name__.rpartition('.')[0] # 2.6 and later

__cached__ = None # 3.2 and later

__loader__ = None # 3.3 and later

The `sys.modules` entry for ``__name__`` will be set to a new module, and

``sys.path[0]`` will be changed to the value of `file` without the filename.

Both values are restored when this function exits.

'''

original_main = sys.modules.get('__main__')

global_variables = dict(global_variables)

mod_name = global_variables.setdefault('__name__', '<run_path>')

mod = sys.modules[mod_name] = imp.new_module(mod_name)

mod.__dict__.update(global_variables)

global_variables = mod.__dict__

global_variables.setdefault('__file__', file)

if sys.version_info[0] >= 3 or sys.version_info[1] >= 6:

global_variables.setdefault('__package__', mod_name.rpartition('.')[0])

if sys.version_info[0] >= 3:

if sys.version_info[1] >= 2:

global_variables.setdefault('__cached__', None)

if sys.version_info[1] >= 3:

try:

global_variables.setdefault('__loader__', original_main.__loader__)

except AttributeError:

pass

sys.path[0] = os.path.split(file)[0]

code_obj = compile(code, file, 'exec')

exec(code_obj, global_variables)

def exec_file(file, global_variables):

'''Executes the provided script as if it were the original script provided

to python.exe. The functionality is similar to `runpy.run_path`, which was

added in Python 2.7/3.2.

The following values in `global_variables` will be set to the following

values, if they are not already set::

__name__ = '<run_path>'

__file__ = file

__package__ = __name__.rpartition('.')[0] # 2.6 and later

__cached__ = None # 3.2 and later

__loader__ = sys.modules['__main__'].__loader__ # 3.3 and later

The `sys.modules` entry for ``__name__`` will be set to a new module, and

``sys.path[0]`` will be changed to the value of `file` without the filename.

Both values are restored when this function exits.

'''

f = open(file, "rb")

try:

code = f.read().replace(to_bytes('\r\n'), to_bytes('\n')) + to_bytes('\n')

finally:

f.close()

exec_code(code, file, global_variables)

def exec_module(module, global_variables):

'''Executes the provided module as if it were provided as '-m module'. The

functionality is implemented using `runpy.run_module`, which was added in

Python 2.5.

'''

import runpy

runpy.run_module(module, global_variables, run_name=global_variables.get('__name__'), alter_sys=True)

UNICODE_PREFIX = to_bytes('U')

ASCII_PREFIX = to_bytes('A')

NONE_PREFIX = to_bytes('N')

def read_bytes(conn, count):

b = to_bytes('')

while len(b) < count:

b += conn.recv(count - len(b))

return b

def write_bytes(conn, b):

conn.sendall(b)

def read_int(conn):

return struct.unpack('!q', read_bytes(conn, 8))[0]

def write_int(conn, i):

write_bytes(conn, struct.pack('!q', i))

def read_string(conn):

""" reads length of text to read, and then the text encoded in UTF-8, and returns the string"""

strlen = read_int(conn)

if not strlen:

return ''

res = to_bytes('')

while len(res) < strlen:

res = res + conn.recv(strlen - len(res))

res = utf_8.decode(res)[0]

if sys.version_info[0] == 2 and sys.platform != 'cli':

# Py 2.x, we want an ASCII string if possible

try:

res = ascii.Codec.encode(res)[0]

except UnicodeEncodeError:

pass

return res

def write_string(conn, s):

if s is None:

write_bytes(conn, NONE_PREFIX)

elif isinstance(s, unicode):

b = utf_8.encode(s)[0]

b_len = len(b)

write_bytes(conn, UNICODE_PREFIX)

write_int(conn, b_len)

if b_len > 0:

write_bytes(conn, b)

else:

s_len = len(s)

write_bytes(conn, ASCII_PREFIX)

write_int(conn, s_len)

if s_len > 0:

write_bytes(conn, s)

class SafeRepr(object):

# String types are truncated to maxstring_outer when at the outer-

# most level, and truncated to maxstring_inner characters inside

# collections.

maxstring_outer = 2 ** 16

maxstring_inner = 30

if sys.version_info >= (3, 0):

string_types = (str, bytes)

set_info = (set, '{', '}', False)

frozenset_info = (frozenset, 'frozenset({', '})', False)

else:

string_types = (str, unicode)

set_info = (set, 'set([', '])', False)

frozenset_info = (frozenset, 'frozenset([', '])', False)

# Collection types are recursively iterated for each limit in

# maxcollection.

maxcollection = (15, 10)

# Specifies type, prefix string, suffix string, and whether to include a

# comma if there is only one element. (Using a sequence rather than a

# mapping because we use isinstance() to determine the matching type.)

collection_types = [

(tuple, '(', ')', True),

(list, '[', ']', False),

frozenset_info,

set_info,

]

try:

from collections import deque

collection_types.append((deque, 'deque([', '])', False))

except:

pass

# type, prefix string, suffix string, item prefix string, item key/value separator, item suffix string

dict_types = [(dict, '{', '}', '', ': ', '')]

try:

from collections import OrderedDict

dict_types.append((OrderedDict, 'OrderedDict([', '])', '(', ', ', ')'))

except:

pass

# All other types are treated identically to strings, but using

# different limits.

maxother_outer = 2 ** 16

maxother_inner = 30

def __call__(self, obj):

try:

return ''.join(self._repr(obj, 0))

except:

try:

return 'An exception was raised: %r' % sys.exc_info()[1]

except:

return 'An exception was raised'

def _repr(self, obj, level):

'''Returns an iterable of the parts in the final repr string.'''

try:

obj_repr = type(obj).__repr__

except:

obj_repr = None

def has_obj_repr(t):

r = t.__repr__

try:

return obj_repr == r

except:

return obj_repr is r

for t, prefix, suffix, comma in self.collection_types:

if isinstance(obj, t) and has_obj_repr(t):

return self._repr_iter(obj, level, prefix, suffix, comma)

for t, prefix, suffix, item_prefix, item_sep, item_suffix in self.dict_types:

if isinstance(obj, t) and has_obj_repr(t):

return self._repr_dict(obj, level, prefix, suffix, item_prefix, item_sep, item_suffix)

for t in self.string_types:

if isinstance(obj, t) and has_obj_repr(t):

return self._repr_str(obj, level)

if self._is_long_iter(obj):

return self._repr_long_iter(obj)

return self._repr_other(obj, level)

# Determines whether an iterable exceeds the limits set in maxlimits, and is therefore unsafe to repr().

def _is_long_iter(self, obj, level = 0):

try:

# Strings have their own limits (and do not nest). Because they don't have __iter__ in 2.x, this

# check goes before the next one.

if isinstance(obj, self.string_types):

return len(obj) > self.maxstring_inner

# If it's not an iterable (and not a string), it's fine.

if not hasattr(obj, '__iter__'):

return False

# Iterable is its own iterator - this is a one-off iterable like generator or enumerate(). We can't

# really count that, but repr() for these should not include any elements anyway, so we can treat it

# the same as non-iterables.

if obj is iter(obj):

return False

# xrange reprs fine regardless of length.

if isinstance(obj, xrange):

return False

# numpy and scipy collections (ndarray etc) have self-truncating repr, so they're always safe.

try:

module = type(obj).__module__.partition('.')[0]

if module in ('numpy', 'scipy'):

return False

except:

pass

# Iterables that nest too deep are considered long.

if level >= len(self.maxcollection):

return True

# It is too long if the length exceeds the limit, or any of its elements are long iterables.

if hasattr(obj, '__len__'):

try:

l = len(obj)

except:

l = None

if l is not None and l > self.maxcollection[level]:

return True

return any((self._is_long_iter(item, level + 1) for item in obj))

return any(i > self.maxcollection[level] or self._is_long_iter(item, level + 1) for i, item in enumerate(obj))

except:

# If anything breaks, assume the worst case.

return True

def _repr_iter(self, obj, level, prefix, suffix, comma_after_single_element = False):

yield prefix

if level >= len(self.maxcollection):

yield '...'

else:

count = self.maxcollection[level]

yield_comma = False

for item in obj:

if yield_comma:

yield ', '

yield_comma = True

count -= 1

if count <= 0:

yield '...'

break

for p in self._repr(item, 100 if item is obj else level + 1):

yield p

else:

if comma_after_single_element and count == self.maxcollection[level] - 1:

yield ','

yield suffix

def _repr_long_iter(self, obj):

try:

obj_repr = '<%s, len() = %s>' % (type(obj).__name__, len(obj))

except:

try:

obj_repr = '<' + type(obj).__name__ + '>'

except:

obj_repr = '<no repr available for object>'

yield obj_repr

def _repr_dict(self, obj, level, prefix, suffix, item_prefix, item_sep, item_suffix):

if not obj:

yield prefix + suffix

return

if level >= len(self.maxcollection):

yield prefix + '...' + suffix

return

yield prefix

count = self.maxcollection[level]

yield_comma = False

try:

sorted_keys = sorted(obj)

except Exception:

sorted_keys = list(obj)

for key in sorted_keys:

if yield_comma:

yield ', '

yield_comma = True

count -= 1

if count <= 0:

yield '...'

break

yield item_prefix

for p in self._repr(key, level + 1):

yield p

yield item_sep

try:

item = obj[key]

except Exception:

yield '<?>'

else:

for p in self._repr(item, 100 if item is obj else level + 1):

yield p

yield item_suffix

yield suffix

def _repr_str(self, obj, level):

return self._repr_obj(obj, level, self.maxstring_inner, self.maxstring_outer)

def _repr_other(self, obj, level):

return self._repr_obj(obj, level, self.maxother_inner, self.maxother_outer)

def _repr_obj(self, obj, level, limit_inner, limit_outer):

try:

obj_repr = repr(obj)

except:

try:

obj_repr = object.__repr__(obj)

except:

try:

obj_repr = '<no repr available for ' + type(obj).__name__ + '>'

except:

obj_repr = '<no repr available for object>'

limit = limit_inner if level > 0 else limit_outer

if limit >= len(obj_repr):

yield obj_repr

return

# Slightly imprecise calculations - we may end up with a string that is

# up to 3 characters longer than limit. If you need precise formatting,

# you are using the wrong class.

left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))

yield obj_repr[:left_count]

yield '...'

yield obj_repr[-right_count:]

def _selftest(self):

# Test the string limiting somewhat automatically

tests = []

tests.append((7, 9, 'A' * (5)))

tests.append((self.maxstring_outer + 3, self.maxstring_inner + 3 + 2, 'A' * (self.maxstring_outer + 10)))

if sys.version_info >= (3, 0):

tests.append((self.maxstring_outer + 4, self.maxstring_inner + 4 + 2, bytes('A', 'ascii') * (self.maxstring_outer + 10)))

else:

tests.append((self.maxstring_outer + 4, self.maxstring_inner + 4 + 2, unicode('A') * (self.maxstring_outer + 10)))

for limit1, limit2, value in tests:

assert len(self(value)) <= limit1 <= len(repr(value)), (len(self(value)), limit1, len(repr(value)), value)

assert len(self([value])) <= limit2 <= len(repr([value])), (len(self([value])), limit2, len(repr([value])), self([value]))

def test(source, expected):

actual = self(source)

if actual != expected:

print("Source " + repr(source))

print("Expect " + expected)

print("Actual " + actual)

print("")

assert False

def re_test(source, pattern):

import re

actual = self(source)

if not re.match(pattern, actual):

print("Source " + repr(source))

print("Pattern " + pattern)

print("Actual " + actual)

print("")

assert False

for ctype, _prefix, _suffix, comma in self.collection_types:

for i in range(len(self.maxcollection)):

prefix = _prefix * (i + 1)

if comma:

suffix = _suffix + ("," + _suffix) * i

else:

suffix = _suffix * (i + 1)

#print("ctype = " + ctype.__name__ + ", maxcollection[" + str(i) + "] == " + str(self.maxcollection[i]))

c1 = ctype(range(self.maxcollection[i] - 1))

inner_repr = prefix + ', '.join(str(j) for j in c1)

c2 = ctype(range(self.maxcollection[i]))

c3 = ctype(range(self.maxcollection[i] + 1))

for j in range(i):

c1, c2, c3 = ctype((c1,)), ctype((c2,)), ctype((c3,))

test(c1, inner_repr + suffix)

test(c2, inner_repr + ", ..." + suffix)

test(c3, inner_repr + ", ..." + suffix)

if ctype is set:

# Cannot recursively add sets to sets

break

# Assume that all tests apply equally to all iterable types and only

# test with lists.

c1 = list(range(self.maxcollection[0] * 2))

c2 = [c1 for _ in range(self.maxcollection[0] * 2)]

c1_expect = '[' + ', '.join(str(j) for j in range(self.maxcollection[0] - 1)) + ', ...]'

test(c1, c1_expect)

c1_expect2 = '[' + ', '.join(str(j) for j in range(self.maxcollection[1] - 1)) + ', ...]'

c2_expect = '[' + ', '.join(c1_expect2 for _ in range(self.maxcollection[0] - 1)) + ', ...]'

test(c2, c2_expect)

# Ensure dict keys and values are limited correctly

d1 = {}

d1_key = 'a' * self.maxstring_inner * 2

d1[d1_key] = d1_key

re_test(d1, "{'a+\.\.\.a+': 'a+\.\.\.a+'}")

d2 = {d1_key : d1}

re_test(d2, "{'a+\.\.\.a+': {'a+\.\.\.a+': 'a+\.\.\.a+'}}")

d3 = {d1_key : d2}

if len(self.maxcollection) == 2:

re_test(d3, "{'a+\.\.\.a+': {'a+\.\.\.a+': {\.\.\.}}}")

else:

re_test(d3, "{'a+\.\.\.a+': {'a+\.\.\.a+': {'a+\.\.\.a+': 'a+\.\.\.a+'}}}")

# Ensure empty dicts work

test({}, '{}')

# Ensure dict keys are sorted

d1 = {}

d1['c'] = None

d1['b'] = None

d1['a'] = None

test(d1, "{'a': None, 'b': None, 'c': None}")

if sys.version_info >= (3, 0):

# Ensure dicts with unsortable keys do not crash

d1 = {}

for _ in range(100):

d1[object()] = None

try:

list(sorted(d1))

assert False, "d1.keys() should be unorderable"

except TypeError:

pass

self(d1)

# Test with objects with broken repr implementations

class TestClass(object):

def __repr__(self):

raise NameError

try:

repr(TestClass())

assert False, "TestClass().__repr__ should have thrown"

except NameError:

pass

self(TestClass())

# Test with objects with long repr implementations

class TestClass(object):

repr_str = '<' + 'A' * self.maxother_outer * 2 + '>'

def __repr__(self):

return self.repr_str

re_test(TestClass(), r'\<A+\.\.\.A+\>')

# Test collections that don't override repr

class TestClass(dict): pass

test(TestClass(), '{}')

class TestClass(list): pass

test(TestClass(), '[]')

# Test collections that override repr

class TestClass(dict):

def __repr__(self): return 'MyRepr'

test(TestClass(), 'MyRepr')

class TestClass(list):

def __init__(self, iter = ()): list.__init__(self, iter)

def __repr__(self): return 'MyRepr'

test(TestClass(), 'MyRepr')

# Test collections and iterables with long repr

test(TestClass(xrange(0, 15)), 'MyRepr')

test(TestClass(xrange(0, 16)), '<TestClass, len() = 16>')

test(TestClass([TestClass(xrange(0, 10))]), 'MyRepr')

test(TestClass([TestClass(xrange(0, 11))]), '<TestClass, len() = 1>')

# Test strings inside long iterables

test(TestClass(['a' * (self.maxcollection[1] + 1)]), 'MyRepr')

test(TestClass(['a' * (self.maxstring_inner + 1)]), '<TestClass, len() = 1>')

# Test range

if sys.version[0] == '2':

range_name = 'xrange'

else:

range_name = 'range'

test(xrange(1, self.maxcollection[0] + 1), '%s(1, %s)' % (range_name, self.maxcollection[0] + 1))

# Test directly recursive collections

c1 = [1, 2]

c1.append(c1)

test(c1, '[1, 2, [...]]')

d1 = {1: None}

d1[2] = d1

test(d1, '{1: None, 2: {...}}')

# Find the largest possible repr and ensure it is below our arbitrary

# limit (8KB).

coll = '-' * (self.maxstring_outer * 2)

for limit in reversed(self.maxcollection[1:]):

coll = [coll] * (limit * 2)

dcoll = {}

for i in range(self.maxcollection[0]):

dcoll[str(i) * self.maxstring_outer] = coll

text = self(dcoll)

#try:

# text_repr = repr(dcoll)

#except MemoryError:

# print('Memory error raised while creating repr of test data')

# text_repr = ''

#print('len(SafeRepr()(dcoll)) = ' + str(len(text)) + ', len(repr(coll)) = ' + str(len(text_repr)))

assert len(text) < 8192

# Test numpy types - they should all use their native reprs, even arrays exceeding limits

try:

import numpy as np

except ImportError:

print('WARNING! could not import numpy - skipping all numpy tests.')

else:

test(np.int32(123), repr(np.int32(123)))

test(np.float64(123.456), repr(np.float64(123.456)))

test(np.zeros(self.maxcollection[0] + 1), repr(np.zeros(self.maxcollection[0] + 1)));

if __name__ == '__main__':

print('Running tests...')

SafeRepr()._selftest()

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

visualstudio_py_util.py

Latest commit

History

visualstudio_py_util.py

File metadata and controls