# Guide to using sliceworks with Python (Hướng dẫn dùng sliceworks python)

import argparse

# Command-line options for the HART modem session.
parser = argparse.ArgumentParser()
parser.add_argument('-c', '--com-port', metavar='N', type=int, required=True, help='HART modem com port')
parser.add_argument('-s', '--slave-address', metavar='N', type=int, default=0, help='HART slave address')
parser.add_argument('-l', '--log', action='store_true', help='log to file')
parser.add_argument('-v', '--verbose', action='store_true', help='print values to console')
args = parser.parse_args()

# NOTE(review): setup_logging is not defined in this file; it has to be
# supplied by another module before this line can run.
logger = setup_logging(args.verbose, args.log)

# Pick out the piece of a string that lies between two separators.
# Built on str.partition; works like partition, but drops the separators.
def between(left, right, s):
    """Split ``s`` around the first ``left`` ... ``right`` pair.

    Args:
        left: Opening separator (must be a non-empty string).
        right: Closing separator (must be a non-empty string); it is searched
            for only in the text that follows ``left``.
        s: The string to split.

    Returns:
        A 3-tuple ``(before, inside, after)`` with both separators removed.
        If ``left`` does not occur, the result is ``(s, '', '')``; if only
        ``right`` is missing, ``inside`` is everything after ``left`` and
        ``after`` is empty.

    Raises:
        ValueError: If ``left`` or ``right`` is an empty string (raised by
            ``str.partition``).
    """
    before, _, rest = s.partition(left)
    inside, _, after = rest.partition(right)
    return before, inside, after
# NOTE(review): the markers around "data" were missing from this snippet (the
# first call passed two empty separators, which str.partition rejects with
# ValueError). <a>...</a> is an assumed reconstruction -- confirm against the
# original example.
s = "bla bla blaa <a>data</a> lsdjfasdjöf [important notice] 'Daniweb forum' tcha tcha tchaa"
print(between('<a>', '</a>', s))
print(between('[', ']', s))
print(between("'", "'", s))
# Output:
# ('bla bla blaa ', 'data', " lsdjfasdjöf [important notice] 'Daniweb forum' tcha tcha tchaa")
# ('bla bla blaa <a>data</a> lsdjfasdjöf ', 'important notice', " 'Daniweb forum' tcha tcha tchaa")
# ('bla bla blaa <a>data</a> lsdjfasdjöf [important notice] ', 'Daniweb forum', ' tcha tcha tchaa')

import re

text = 'this is a text'

try:
    # Capture the shortest run of characters between "is" and "text".
    found = re.search(r'is(.+?)text', text).group(1)
except AttributeError:
    # re.search returned None: the pattern does not occur in the string
    found = '0 wtitle'  # apply your error handling

# found == ' is a ' here: the leftmost "is" is the one inside "this"

# To get more than 1 search
# Collect, for every row, all substrings found between "wtitle " and " wcompany".
job_title = []
for text in data.work_experiences:
    try:
        title = re.findall(r"wtitle (.*?) wcompany", text)
    except TypeError:
        # re.findall rejects non-string input (e.g. a missing value)
        title = 'onejob'
    # one entry per row, so the list lines up with the frame when assigned below
    job_title.append(title)
data['job_title'] = job_title

# best way
# Join the listed text columns of each row into one space-separated string.
data['resume'] = data[[
    'Resume_title', 'City', 'State', 'Description', 'work_experiences',
    'Educations', 'Skills', 'Certificates', 'Additional Information',
]].agg(' '.join, axis=1)

# other way
df["period"] = df["Year"] + df["quarter"]
df['Period'] = df['Year'] + ' ' + df['Quarter']
df["period"] = df["Year"].astype(str) + df["quarter"]  # if one (or both) of the columns are not string typed
# Beware of NaNs when doing this!
df['period'] = df[['Year', 'quarter', ...]].agg('-'.join, axis=1)  # for multiple string columns; `...` stands for more column names
df['period'] = df[['Year', 'quarter']].apply(lambda x: ''.join(x), axis=1)
# method cat() of the .str accessor
df['Period'] = df.Year.str.cat(df.Quarter)
df['Period'] = df.Year.astype(str).str.cat(df.Quarter.astype(str), sep='q')
df['AllTogether'] = df['Country'].str.cat(df[['State', 'City']], sep=' - ')  # add parameter na_rep to replace NaN values with a string
columns = ['whatever', 'columns', 'you', 'choose']
df['period'] = df[columns].astype(str).sum(axis=1)

#a function
def str_join(df, sep, *cols):
    """Concatenate several columns of ``df`` row by row into one string Series.

    Args:
        df: Frame to read the columns from.
        sep: Separator placed between the column values.
        *cols: Column labels, joined in the order given.

    Returns:
        A Series whose values are the string forms of the columns joined by
        ``sep``. With a single label the column is returned as-is (no string
        conversion happens because nothing is joined).

    Raises:
        TypeError: If no column label is given (``reduce`` over an empty list).
    """
    from functools import reduce

    return reduce(
        lambda x, y: x.astype(str).str.cat(y.astype(str), sep=sep),
        [df[col] for col in cols],
    )

df['cat'] = str_join(df, '-', 'c0', 'c1', 'c2', 'c3')

import pandas as pd

data = {
    'Product': ['Desktop Computer', 'Tablet', 'Printer', 'Laptop'],
    'Price': [850, 200, 150, 1300],
}

df = pd.DataFrame(data, columns=['Product', 'Price'])

# Placeholder path: replace it with the real destination before running.
df.to_csv(r'Path where you want to store the exported CSV file\File Name.csv')
# df.to_csv('file_name.csv', encoding='utf-8', index=False)
print(df)

df = pd.DataFrame()
# TODO: unfinished snippet -- the loop below had neither a range argument nor a body.
# for i in range(...):
#     ...

for c in df_drop.columns:
    # Remove every run of characters that is neither a word character nor
    # whitespace. regex=True is spelled out because recent pandas versions
    # treat the pattern as a literal string by default.
    df_drop[c] = df_drop[c].str.replace(r'[^\w\s]+', '', regex=True)
df_drop = df_drop.astype(str)

# Label-based slice: all rows, columns 'c1' through 'c4'
rmsval = df.loc[:, 'c1':'c4']
def getrms(row):
    """Return the square root of the sum of ``row**2 / 4``.

    This is the root mean square when ``row`` holds exactly four values; the
    divisor 4 is fixed and does not follow the length of ``row``.

    Args:
        row: Values supporting ``** 2`` and ``/ 4`` element-wise and
            iteration (e.g. a NumPy array or a pandas row).

    Returns:
        The result of ``np.sqrt`` over the summed, scaled squares.
    """
    return np.sqrt(sum(row ** 2 / 4))
# Apply over the c1..c4 slice (rmsval) rather than the whole frame, so that
# unrelated columns do not enter the sum; getrms divides by a fixed 4.
df['rms'] = rmsval.apply(getrms, axis=1)

import glob  # needed here; the file only imports glob further down

# Paths of the .txt files directly inside the folder
all_filenames = glob.glob("/home/lynaza/Desktop/Quinn/lda/檢察官起訴書/*.txt")

# Entry names only (no directory part); not restricted to one file extension
import os
arr = os.listdir("/home/lynaza/Desktop/Quinn/lda/檢察官起訴書")

import cv2
import os
import glob

def load_images_name(path):
    """Collect the ``.tif`` files found up to four levels below ``path``.

    Args:
        path: Root folder as a string (no trailing slash needed).

    Returns:
        A list of matching paths: files directly inside ``path`` first, then
        those one, two and three sub-folders deeper. Deeper files are ignored.
        The list is empty when nothing matches.
    """
    images_path = []
    # One glob pattern per level: path/*.tif, path/*/*.tif, ... (4 levels)
    for depth in range(4):
        images_path += glob.glob(path + '/*' * depth + '/*.tif')
    return images_path

images = load_images_name("/home/lynaza/Desktop/traindata/test")

from google.colab import drive
import sys
# NOTE(review): the path is under /content/drive, and `drive` is imported
# above but never used here -- presumably the Drive mount happens elsewhere; confirm.
train_df = pd.read_csv("/content/drive/MyDrive/train.csv")

for idx in range(num):
    # Print topics 0 .. num-1. NOTE(review): the second argument (6) is
    # presumably the number of terms shown per topic; the earlier comment
    # said 16 -- confirm which was intended.
    print("Topic #%s:" % idx, lda_model.print_topic(idx, 6))

# https://www.dataquest.io/blog/tutorial-time-series-analysis-with-pandas/
# Interpret the 'Time' column as seconds and use the result as the index
df['TIME'] = pd.to_datetime(df['Time'], unit='s')
df_time = df.set_index('TIME')
# Add columns with year, month, and Weekday Name
df_time['Year'] = df_time.index.year
df_time['Month'] = df_time.index.month
# day_name() replaces the `weekday_name` attribute, which current pandas no longer has
df_time['Weekday Name'] = df_time.index.day_name()

# Display a random sampling of 5 rows
df_time.sample(5, random_state=0)

# Visualizing time series data
# NOTE(review): `sns` is not imported anywhere in this file (presumably seaborn).
sns.set(rc={'figure.figsize': (11, 4)})

#You can do it using GloVe library:

#Install it: 

# Notebook-only shell magic, kept as a comment so this file stays valid Python.
# Run it in a notebook cell, or drop the "!" in a terminal:
#   !pip install glove_python

from glove import Corpus, Glove

# Creating a corpus object
corpus = Corpus()

# Training the corpus to generate the co-occurrence matrix which is used in GloVe
# NOTE(review): `lines` is not defined in this file; it must be provided by the caller.
corpus.fit(lines, window=10)

glove = Glove(no_components=5, learning_rate=0.05)
glove.fit(corpus.matrix, epochs=30, no_threads=4, verbose=True)

# for FastText
from gensim.models import FastText
from gensim.test.utils import common_texts  # some example sentences
print(common_texts[0])  # the notes recorded ['human', 'interface', 'computer'] here

# Two-step training: build the vocabulary first, then train on the same sentences.
# NOTE(review): `vector_size=` is the gensim 4 spelling, where build_vocab/train
# take `corpus_iterable=` instead of `sentences=` -- confirm the installed version.
model = FastText(vector_size=4, window=3, min_count=1)  # instantiate
model.build_vocab(corpus_iterable=common_texts)
model.train(corpus_iterable=common_texts, total_examples=len(common_texts), epochs=10)  # train
# One-step alternative: pass the sentences to the constructor
model2 = FastText(vector_size=4, window=3, min_count=1, sentences=common_texts, epochs=10)

import numpy as np
# Compare the vectors both models learned for the same word
np.allclose(model.wv['computer'], model2.wv['computer'])

from gensim.test.utils import datapath
corpus_file = datapath('lee_background.cor')  # absolute path to corpus
model3 = FastText(vector_size=4, window=3, min_count=1)
model3.build_vocab(corpus_file=corpus_file)  # scan over corpus to build the vocabulary
total_words = model3.corpus_total_words  # number of words in the corpus
model3.train(corpus_file=corpus_file, total_words=total_words, epochs=5)

from gensim.utils import tokenize
from gensim import utils
class MyIter:
    """Re-iterable source of tokenized lines from a gensim test-data file.

    Each ``iter()`` call reopens 'crime-and-punishment.txt' (located through
    ``datapath``), so the object can be iterated more than once.
    """

    def __iter__(self):
        """Yield one list of tokens per line of the file."""
        path = datapath('crime-and-punishment.txt')
        with utils.open(path, 'r', encoding='utf-8') as fin:
            for line in fin:
                yield list(tokenize(line))
model4 = FastText(vector_size=4, window=3, min_count=1)
# The vocabulary must be built before corpus_count is read and before training
model4.build_vocab(corpus_iterable=MyIter())
total_examples = model4.corpus_count
model4.train(corpus_iterable=MyIter(), total_examples=total_examples, epochs=5)
from gensim.test.utils import get_tmpfile
fname = get_tmpfile("fasttext.model")
# Save first: loading from a temp file that was never written cannot succeed
model.save(fname)
model = FastText.load(fname)

# https://radimrehurek.com/gensim/models/fasttext.html

# Install camelot from a shell (these are shell commands, not Python):
# pip
#   pip install camelot-py
# conda
#   conda install -c conda-forge camelot-py
import camelot
tables = camelot.read_pdf('foo.pdf', pages='1', flavor='lattice')
tables.export('foo.csv', f='csv', compress=True)
tables[0].to_csv('foo.csv')  # to a csv file
print(tables[0].df)  # to a df

# from website
import pandas as pd
# The URL needs its scheme and its literal parentheses to resolve.
simpsons = pd.read_html('https://en.wikipedia.org/wiki/List_of_The_Simpsons_episodes_(seasons_1%E2%80%9320)')
# getting the first 5 rows of the table "Season 1" (second table)
simpsons[1].head()

# Keep only rows whose 'resume_ontology' text is non-empty after stripping
# whitespace (an empty string converts to False).
df = df[df['resume_ontology'].str.strip().astype(bool)]

cmt['time'] = pd.to_datetime(cmt['post_time'])
# .copy() so the assignment below edits an independent frame, not a slice of cmt
cmt_4 = cmt[cmt['time'] >= '2022-02-01'].copy()
# convert the datetime column back to strings
# (%m = month, %d = day; the previous %M / %D meant minute and mm/dd/yy)
cmt_4["time"] = cmt_4["time"].dt.strftime('%Y:%m:%d')

# import pandas
import pandas as pd
# read csv data
df1 = pd.read_csv('Student_data.csv')
df2 = pd.read_csv('Course_enrolled.csv')
# Right join on 'Name': every row of df2 is kept, with matching df1 columns attached
Right_join = pd.merge(df1, df2,
                      on='Name',
                      how='right')

