39 lines
		
	
	
		
			1015 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			39 lines
		
	
	
		
			1015 B
		
	
	
	
		
			Python
		
	
	
	
	
	
| # -*- coding: utf-8 -*-
 | |
| from datetime import datetime
 | |
| import hashlib
 | |
| import os
 | |
| import re
 | |
| import struct
 | |
| 
 | |
| def sanitize(string, ignore_characters=None):
 | |
|     """Sanitize a string to strip special characters.
 | |
| 
 | |
|     :param str string: the string to sanitize.
 | |
|     :param set ignore_characters: characters to ignore.
 | |
|     :return: the sanitized string.
 | |
|     :rtype: str
 | |
| 
 | |
|     """
 | |
|     # only deal with strings
 | |
|     if string is None:
 | |
|         return
 | |
| 
 | |
|     ignore_characters = ignore_characters or set()
 | |
| 
 | |
|     # replace some characters with one space
 | |
|     # characters = {'-', ':', '(', ')', '.'} - ignore_characters
 | |
|     # if characters:
 | |
|     #     string = re.sub(r'[%s]' % re.escape(''.join(characters)), ' ', string)
 | |
| 
 | |
|     # remove some characters
 | |
|     characters = {'\''} - ignore_characters
 | |
|     if characters:
 | |
|         string = re.sub(r'[%s]' % re.escape(''.join(characters)), '', string)
 | |
| 
 | |
|     # replace multiple spaces with one
 | |
|     string = re.sub(r'\s+', ' ', string)
 | |
| 
 | |
|     # strip and lower case
 | |
|     return string.strip().lower()
 | |
| 
 |