Search
 
SCRIPT & CODE EXAMPLE
 

PYTHON

Split the string using the separator

# Break a comma-separated string into a list of its fields and show it.
text = "Orange,Apple,Grapes,WaterMelon,Kiwi"
print(text.split(sep=','))
Comment

split strings around given separator/delimiter

# Split a "City, State" column into separate City and State columns.
import pandas as pd

# Sample data; note that the spacing after the comma is inconsistent.
df = pd.DataFrame({
    'Location': [
        'Cupertino,California',
        'Los Angles, California',
        'Palo Alto, California',
    ],
})

# Split on the comma together with any whitespace around it, so the new
# columns carry no stray leading/trailing spaces (a plain ',' separator
# would leave ' California' for the rows written with ", ").
# str.split treats a pattern longer than one character as a regular
# expression.
df[['City', 'State']] = df['Location'].str.split(r'\s*,\s*', expand=True)
print(df)
Comment

split string into words and separators

def split_words_separators(an_input: str) -> list:
    """Split ``an_input`` on runs of spaces/commas, keeping the separators.

    Returns a two-element list: ``[words, separators]``, where ``words`` are
    the pieces between separators and ``separators`` are the matched runs of
    spaces and/or commas, both in order of appearance.
    """
    # The capturing group makes re.split keep the separators in its result,
    # so words and separators alternate, starting with a word.
    pieces = re.split(r"([ ,]+)", an_input)
    words = pieces[0::2]        # even positions
    separators = pieces[1::2]   # odd positions
    return [words, separators]
Comment

split a string into delimiter-separated words

import re
from collections import Counter

class analysedText(object):
    """Normalise a passage of text and report word frequencies.

    Attributes:
        text: The passage exactly as supplied by the caller.
        fmtText: The passage lower-cased, with every character other than
            ASCII letters, digits and the space character removed.
    """

    def __init__(self, text):
        """Store ``text`` and build its normalised form in ``fmtText``."""
        self.text = text
        # Lower-case first, then drop everything that is not an ASCII
        # letter, digit or space (this strips punctuation such as ',.!?').
        self.fmtText = re.sub('[^A-Za-z0-9 ]', '', self.text.lower())

    def freqAll(self):
        """Return a Counter mapping each word in ``fmtText`` to its count.

        Words are the whitespace-separated tokens of ``fmtText``; an empty
        or all-space text yields an empty Counter.
        """
        # str.split() with no argument splits on runs of whitespace and
        # ignores leading/trailing whitespace, so words are never cut at a
        # letter and no empty-string tokens are counted.
        return Counter(self.fmtText.split())

    def freqOf(self, word):
        """Return how many times ``word`` occurs in ``fmtText`` (0 if absent)."""
        # Counter returns 0 for a missing key, so no membership test is needed.
        return self.freqAll()[word]
    
import sys

# Expected word -> count mapping that the checks compare results against.
sampleMap = {
    'eirmod': 1,
    'sed': 1,
    'amet': 2,
    'diam': 5,
    'consetetur': 1,
    'labore': 1,
    'tempor': 1,
    'dolor': 1,
    'magna': 2,
    'et': 3,
    'nonumy': 1,
    'ipsum': 1,
    'lorem': 2,
}

def testMsg(passed):
    if passed:                  #if True
       return 'Test Passed'
    else :
       return 'Test Failed'

# Self-checks for analysedText: each section prints a label followed by a
# pass/fail verdict. Only ordinary exceptions are caught (not
# KeyboardInterrupt/SystemExit), and the cause is reported on stderr so a
# failure is not silently hidden; stdout output is unchanged.
print('Constructor: ')
try:
    samplePassage = analysedText('Lorem ipsum dolor! diam amet, consetetur Lorem magna. sed diam nonumy eirmod tempor. diam et labore? et diam magna. et diam amet.')
    print(testMsg(samplePassage.fmtText == 'lorem ipsum dolor diam amet consetetur lorem magna sed diam nonumy eirmod tempor diam et labore et diam magna et diam amet'))
except Exception as exc:
    print('Error detected. Recheck your function ' )
    print(repr(exc), file=sys.stderr)
print('freqAll: ')
try:
    wordMap = samplePassage.freqAll()
    print(testMsg(wordMap==sampleMap))
except Exception as exc:
    print('Error detected. Recheck your function ' )
    print(repr(exc), file=sys.stderr)
print('freqOf: ')
try:
    # Every expected word must be reported with exactly its expected count.
    passed = all(
        samplePassage.freqOf(word) == count
        for word, count in sampleMap.items()
    )
    print(testMsg(passed))
except Exception as exc:
    print('Error detected. Recheck your function  ' )
    print(repr(exc), file=sys.stderr)
Comment

PREVIOUS NEXT
Code Example
Python :: convert method to str python 
Python :: python test coverage 
Python :: fix the size of a deque python 
Python :: python delete key if exists 
Python :: dictionary multiple values per key 
Python :: github3 python 
Python :: python remove all occurrences of an item from a list 
Python :: add legend to colorbar 
Python :: permutation and combination program in python 
Python :: python print bytes 
Python :: hexdigest python 
Python :: lower method in python 
Python :: += in python 
Python :: textrank python implementation 
Python :: declaring list size python 
Python :: python power of e 
Python :: web scraping with selenium 
Python :: discord py join and leave call 
Python :: two pointer function in python 
Python :: django url with slug 
Python :: remove first element from list python 
Python :: color reverse 
Python :: list vs tuple 
Python :: scrapy with selenium 
Python :: python number type 
Python :: or operator in python 
Python :: Syntax of Python Frozenset 
Python :: repeat string python 
Python :: python list extend 
Python :: self keyword in python 
ADD CONTENT
Topic
Content
Source link
Name
7+9 =