python APIs

python 备忘录

[TOC]

简单API

FUN: 重命名目录下文件

filter
lambda

def format_filename(dir):
    """Rename every entry directly inside ``dir`` by stripping unwanted characters.

    The characters ``#``, space, ``(``, ``)``, ``{`` and ``}`` are removed
    from each name. Every mapping ``old ----> new`` is printed.

    Args:
        dir: Path of the directory to process, with or without a trailing
            path separator.

    Raises:
        OSError: propagated from ``os.listdir`` / ``os.rename``.
    """
    unwanted = '# (){}'
    for f in os.listdir(dir):
        new_n = ''.join(ch for ch in f if ch not in unwanted)
        print(f, ' ----> ', new_n)
        # Nothing to do when the name is unchanged; an empty result would
        # make the target the directory itself, so leave that entry alone.
        if not new_n or new_n == f:
            continue
        # os.path.join inserts the separator that plain `dir + f` omitted.
        os.rename(os.path.join(dir, f), os.path.join(dir, new_n))

traceback

def log_error(e):
    """Print diagnostic details about exception ``e`` to stdout.

    Prints the exception, the current ``request.form``, the file and line
    recorded in the first traceback entry, and the formatted traceback.

    Args:
        e: The exception instance to report.

    NOTE(review): ``request`` is not defined in this snippet; presumably it
    is ``flask.request`` -- confirm against the surrounding application.
    """
    print('err:', e)
    print('err:', request.form)
    tb = e.__traceback__
    if tb is not None:  # None when the exception was never raised
        # The first traceback entry is the outermost frame (where the
        # exception was caught); follow tb.tb_next to reach the raise site.
        # .get() avoids a KeyError when the frame's globals have no __file__.
        print('err file:', tb.tb_frame.f_globals.get("__file__"))
        print('err file line:', tb.tb_lineno)
    # traceback.print_exc() returns None, so printing its result only showed
    # "None"; format the traceback of `e` itself into the message instead.
    print('err ', ''.join(traceback.format_exception(type(e), e, tb)))

Time

>>> time.ctime()
'Thu May 5 14:58:09 2011'
>>> time.ctime(time.time())
'Thu May 5 14:58:39 2011'
>>> time.ctime(1304579615)
'Thu May 5 15:13:35 2011'

os

1	os.mkdir()

os.path

os.path.basename()

os.path.dirname()

path = '/home/User/Documents'
dirname = os.path.dirname(path)
print(dirname)


path = '/home/User/Documents/file.txt'
dirname = os.path.dirname(path)
print(dirname)


path = 'file.txt'
dirname = os.path.dirname(path)
print(dirname)

# 三个的结果：
>>>/home/User
>>>/home/User/Documents
>>>

expanduser

python的os.path 模块提供了一个expanduser函数，它可以将参数中开头部分的 ~ 替换为当前用户的home目录、将 ~user 替换为用户 user 的home目录并返回。仅看定义难以理解，我在linux系统和windows系统下分别实验它的功能。

在linux系统下，我的账号是kwsy，这个用户的home目录是/home/kwsy，下面的代码演示如何使用expanduser函数。

Python 3.7.0 (default, Jun 28 2018, 13:15:42)
[GCC 7.2.0] :: Anaconda, Inc. on linux
Type "help", "copyright", "credits" or "license" for more information.
>>> import os
>>> os.path.expanduser('~/.config/')
'/home/kwsy/.config/'

expandvars

Python中的 os.path.expandvars() 方法用于扩展给定路径中的环境变量。它将给定路径中形式为 $name 或 ${name} 的子字符串替换为环境变量 name 的值。

todo

random

random.randint(0, N) -> 返回 [0, 1, ..., N] 中的一个整数（两端都包含）

str

# Three ways to check whether a substring occurs in a string.
text = 'hello world'

# 1. The `in` / `not in` operators: plain membership tests that yield a bool.
if 'w' in text:
    print('find w in text')

if 'hello' in text:
    print('find')

if 'hello' not in text:
    print(' not find ')


# 2. str.find(): compared against -1 here, the value it returns on a miss.
if text.find('xxx') != -1:
     print('find position=', text.find('xxx'))

# 3. str.index(): raises ValueError on a miss, so wrap the call in try/except.
try:
    position = text.index('not exits char')
except ValueError:
    print('not find ')

dict_2_obj

自定义

class obj(object):
    """Expose the keys of a dict as attributes, converting nested dicts too.

    A dict value becomes another ``obj``. A list or tuple value becomes a
    list whose dict elements are converted to ``obj``; other elements and
    other values are stored unchanged.
    """

    def __init__(self, d):
        def wrap(value):
            # Only dicts are converted; everything else passes through.
            return obj(value) if isinstance(value, dict) else value

        for key, value in d.items():
            if isinstance(value, (list, tuple)):
                converted = [wrap(item) for item in value]
            else:
                converted = wrap(value)
            setattr(self, key, converted)
d = {'a': 1, 'b': {'c': 2}, 'd': ["hi", {'foo': "cjavapy"}]}
o = obj(d)
print(o)
print(o.a)
print(o.b)
print(o.d)
print(o.d[1].foo)

json

import json
class obj(object):
    """Plain namespace whose attributes are copied from a dict."""

    def __init__(self, dict_):
        vars(self).update(dict_)


def dict2obj(d):
    """Convert ``d`` into nested ``obj`` instances via a JSON round-trip.

    ``d`` is serialized with ``json.dumps`` and parsed back with ``obj`` as
    the ``object_hook``, so every JSON object in the result is an ``obj``.
    """
    serialized = json.dumps(d)
    return json.loads(serialized, object_hook=obj)
d = {'a': 1, 'b': {'c': 2}, 'd': ['hi', {'foo': 'cjavapy'}]}
o = dict2obj(d)
print(o)
print(o.a)
print(o.b)
print(o.d)
print(o.d[1].foo)

namedtuple

from collections import namedtuple
class struct(object):
    """Factory that converts nested dicts into namedtuples.

    Calling ``struct(data)`` never returns a ``struct`` instance:
    a dict yields a namedtuple named ``'struct'`` whose fields are the dict
    keys; a tuple, list, set or frozenset yields a container of the same
    type with each element converted; any other value is returned as is.
    """

    def __new__(cls, data):
        if isinstance(data, dict):
            record_type = namedtuple('struct', data.keys())
            field_values = [struct(value) for value in data.values()]
            return record_type(*field_values)
        if isinstance(data, (tuple, list, set, frozenset)):
            container = type(data)
            return container(struct(item) for item in data)
        return data
d = {'a': 1, 'b': {'c': 2}, 'd': ['hi', {'foo': 'cjavapy'}]}
o = struct(d)
print(o)
print(o.a)
print(o.b)
print(o.d)
print(o.d[1].foo)

json

json.dumps()
json.loads()
import json

# json.dumps(): serialize a dict into a JSON-formatted string
dict1 = {"age": "12"}
json_info = json.dumps(dict1)

# Writing JSON data: json.dump() serializes straight into the open file
with open('data.json', 'w') as f:
    json.dump(dict1, f)

# Reading data back: json.load() parses the file into Python objects
with open('data.json', 'r') as f:
    data = json.load(f)

np

import numpy as np

a = [1, 2, 3]          # sample data so the snippet runs on its own
a = np.array(a)
np.save('a.npy', a)    # save in .npy format

a = np.load('a.npy')   # load the array back from disk
a = a.tolist()         # convert the ndarray to a plain Python list

csv

import pandas as pd

# Read a ':'-separated UTF-8 text file that has no header row
readme = pd.read_csv('读我.txt', sep=':', encoding="utf-8", engine='python', header=None)
# Convert the resulting DataFrame to a NumPy array
readme = np.array(readme)

高级API

组合函数 itertools.combinations()元素不可重复

1
2
3

itertools.combinations(iters,n)元组输出迭代器，需List显示，全组合直接append分三个元组。
combinations('ABCD', 2) --> AB AC AD BC BD CD
combinations(range(4), 3) --> 012 013 023 123

ref:组合blog

combinations

import itertools

iterable = [1, 2, 3]  # items to choose from
r = 2                 # length of each combination
combinations2 = itertools.combinations(iterable, r)
for combo in combinations2:
    print(combo)
# Output:
# (1, 2)
# (1, 3)
# (2, 3)

combinations_with_replacement() 元素可重复的组合

import itertools

# Define an iterable to draw elements from
iterable = [1, 2, 3]

# Each combination has length 2
r = 2

# Build an iterator over combinations in which an element may repeat
combinations = itertools.combinations_with_replacement(iterable, r)

# Print every combination
for combo in combinations:
    print(combo)

out

(1, 1)  
(1, 2)  
(1, 3)  
(2, 2)  
(2, 3)  
(3, 3)

@property的理解和使用

@property
def password(self):
    """Reject reads: ``password`` is a write-only attribute."""
    raise AttributeError('password is not a readable attribute')

@password.setter
def password(self, password):
    """Store the result of ``generate_password_hash(password)`` in ``self.password_hash``."""
    # NOTE(review): generate_password_hash is not defined in this snippet;
    # presumably it comes from werkzeug.security -- confirm.
    self.password_hash = generate_password_hash(password)

通常赋值函数

class Student(object):
    """Student whose score is read and written through explicit accessor methods."""

    def get_score(self):
        """Return the stored score."""
        return self._score

    def set_score(self, value):
        """Validate ``value`` and store it as the score.

        Raises:
            ValueError: if ``value`` is not an int or lies outside 0..100.
        """
        is_integer = isinstance(value, int)
        if not is_integer:
            raise ValueError('score must be an integer!')
        in_range = 0 <= value <= 100
        if not in_range:
            raise ValueError('score must between 0 ~ 100!')
        self._score = value


>>> s = Student()
>>> s.set_score(60) # ok!
>>> s.get_score()
60
>>> s.set_score(9999)
Traceback (most recent call last):
  ...
ValueError: score must between 0 ~ 100!

@property

但是为了方便,节省时间,我们不想写s.set_score(9999)啊,直接写s.score = 9999不是更快么,加了方法做限制不能让调用的时候变麻烦啊,@property快来帮忙….

class Student(object):
    """Student whose ``score`` attribute is validated on assignment."""

    @property
    def score(self):
        """Return the stored score."""
        return self._score

    @score.setter
    def score(self, value):
        """Validate ``value`` and store it as the score.

        Raises:
            ValueError: if ``value`` is not an int or lies outside 0..100.
        """
        is_integer = isinstance(value, int)
        if not is_integer:
            raise ValueError('分数必须是整数才行呐')
        in_range = 0 <= value <= 100
        if not in_range:
            raise ValueError('分数必须0-100之间')
        self._score = value

看上面代码可知,把get方法变为属性只需要加上@property装饰器即可,此时@property本身又会创建另外一个装饰器@score.setter,负责把set方法变成给属性赋值,这么做完后,我们调用起来既可控又方便

>>> s = Student()
>>> s.score = 60 # OK，实际转化为s.set_score(60)
>>> s.score # OK，实际转化为s.get_score()
60
>>> s.score = 9999
Traceback (most recent call last):
  ...
ValueError: 分数必须0-100之间

MP

对于一般进程间共享数据来说，使用
multiprocessing.Manager().Value
和multiprocessing.Manager().list()
和multiprocessing.Manager().dict()即可。
Or:
Queue()

pyLint

# Install
pip install pylint
pylint --version

#使用,生成默认配置文件：
pylint --persistent=n --generate-rcfile > .pylintrc

# 检查单个文件：
pylint [options] m1.py

# 整个项目
pylint [options] project_path

re

去除英文标点符号

# The hyphen is escaped so it is a literal '-'. Unescaped, '\'-?' is a range
# from "'" to "?" that also strips digits and ( ) * + / < = >.
s = re.sub(r'[.,"\'\-?:!;]', '', s)

去除中文

temp = re.sub('[\u4e00-\u9fa5]','',text)

去除英文

temp = re.sub('[a-zA-Z]','',text)

del数字

# Raw string: '\d' in a normal string literal is an invalid escape sequence.
# For str patterns \d also matches non-ASCII decimal digits; use [0-9] for ASCII only.
temp = re.sub(r'[\d]', '', text)

del 空格

# Raw string: '\s' in a normal string literal is an invalid escape sequence.
# This removes ALL whitespace; text.strip() would only trim the two ends.
temp = re.sub(r'[\s]', '', text)

RUN

# 1 normal run
python -u main.py


# 2 subdir run
python demo/main.py
--修改main文件
import os, sys
sys.path.append(os.path.dirname(os.path.dirname(os.path.realpath(__file__))))


# 3 -m 运行
python -m model.main