What's the best way to strip punctuation from a string in Python?
First, is there a convenient way to get all punctuation characters? It turns out there is, via the built-in string module.
import string
string.punctuation
'!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~'
One approach would be to use a list comprehension.
PUNCTUATION = set(string.punctuation)
def remove_punctuation_set(s):
    return "".join(c for c in s if c not in PUNCTUATION)
TEST_STRING = "Hello world! How are you? I'm good, hope you are too!"
remove_punctuation_set(TEST_STRING)
'Hello world How are you Im good hope you are too'
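The set here is a deliberate choice: membership tests against a plain string also work, but average-case lookup in a set is O(1) versus a linear scan for a string. A minimal sketch (helper names are hypothetical) showing both give identical results:

```python
import string

PUNCT_STR = string.punctuation       # linear scan per membership test
PUNCT_SET = set(string.punctuation)  # O(1) average-case membership test

def remove_with_str(s):
    return "".join(c for c in s if c not in PUNCT_STR)

def remove_with_set(s):
    return "".join(c for c in s if c not in PUNCT_SET)

print(remove_with_set("Hello, world!"))  # -> Hello world
```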
Next, we can look at regular expressions.
re.sub replaces matches with a given replacement string. Here, we'd replace punctuation characters with the empty string. Naively, we might write re.sub(f"[{string.punctuation}]", "", TEST_STRING), however this has a few issues:
- If we're applying the pattern repeatedly, it's faster to compile it once up front
- Many punctuation characters are regex special characters which need to be escaped
Luckily, there's the re.escape function, which escapes every regex special character in a given string.
import re
re.escape(string.punctuation)
'!"\\#\\$%\\&\'\\(\\)\\*\\+,\\-\\./:;<=>\\?@\\[\\\\\\]\\^_`\\{\\|\\}\\~'
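To see why escaping matters, here's a small sketch using the substring "a-z" rather than the full punctuation set: inside square brackets, an unescaped "-" silently becomes a character range instead of a literal.

```python
import re

chars = "a-z"  # we want to remove the literal characters 'a', '-' and 'z'
unescaped = re.sub(f"[{chars}]", "", "abcz-")           # "[a-z]" is a range: strips a through z
escaped = re.sub(f"[{re.escape(chars)}]", "", "abcz-")  # "[a\-z]" matches only 'a', '-', 'z'
print(unescaped)  # -> -
print(escaped)    # -> bc
```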
We can now create our pre-compiled regex. Square brackets in a regex define a character class: the pattern matches any single character that appears inside the brackets.
PATTERN = re.compile(f"[{re.escape(string.punctuation)}]")
def remove_punctuation_regex(s):
    return PATTERN.sub("", s)
remove_punctuation_regex(TEST_STRING)
'Hello world How are you Im good hope you are too'
Finally, there's a little-known approach using the translate method on strings. This transforms a string using a mapping (e.g. a dictionary) between ordinals (Python calls these mappings "translation tables").
What do we mean by ordinals? An ordinal is the integer value assigned to a character in Unicode, also known as its code point. We can get the ordinal for a character using the built-in ord function.
ord("a"), ord("b"), ord("c")
(97, 98, 99)
We can also go from ordinals back to characters using the built-in chr function.
chr(97), chr(98), chr(99)
('a', 'b', 'c')
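The two functions are inverses of each other, and they work for any Unicode code point, not just ASCII:

```python
# chr and ord round-trip exactly
assert chr(ord("a")) == "a"

# they also cover non-ASCII characters
print(ord("€"))   # -> 8364 (U+20AC)
print(chr(8364))  # -> €
```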
An example of using translate:
"hebbo worbd!".translate(
    {
        ord("b"): ord("l"),
        ord("!"): None,  # mapping to None removes the character
    }
)
'hello world'
So, all we have to do is create a mapping from the ordinal of every punctuation character to None, like so:
PUNCTUATION_MAPPING = {ord(c): None for c in string.punctuation}
def remove_punctuation_translate(s):
    return s.translate(PUNCTUATION_MAPPING)
remove_punctuation_translate(TEST_STRING)
'Hello world How are you Im good hope you are too'
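As a side note, translation-table values aren't limited to single ordinals and None: a value can also be a replacement string of any length, so one character can expand into several. A quick sketch:

```python
# a table value may be a whole string, not just one ordinal
table = {ord("!"): "?!", ord(" "): None}
print("wow! nice!".translate(table))  # -> wow?!nice?!
```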
There's also a helpful function under the str namespace that creates the mappings (aka translation tables) for us:
table = str.maketrans("b", "l", "!")
"hebbo worbd".translate(table)
'hello world'
The first argument of maketrans is a string of characters to replace: the i'th character of the first argument is replaced by the i'th character of the second argument. The optional third argument is a string of characters to remove.
By passing empty strings as the first and second arguments and string.punctuation as the third, we can replicate our PUNCTUATION_MAPPING dictionary.
assert str.maketrans("", "", string.punctuation) == PUNCTUATION_MAPPING
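maketrans can also be called with a single dict argument mapping characters (or ordinals) to their replacements, which it converts into an ordinal-keyed table. Rewriting the earlier translate example this way:

```python
# dict form: keys are single characters, values are replacements (None removes)
table = str.maketrans({"b": "l", "!": None})
print("hebbo worbd!".translate(table))  # -> hello world
```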
We can now benchmark each of our approaches using timeit.
import timeit
n = 1_000_000
set_time = timeit.timeit(
    "remove_punctuation_set(TEST_STRING)",
    globals=globals(),
    number=n,
)
regex_time = timeit.timeit(
    "remove_punctuation_regex(TEST_STRING)",
    globals=globals(),
    number=n,
)
translate_time = timeit.timeit(
    "remove_punctuation_translate(TEST_STRING)",
    globals=globals(),
    number=n,
)
The results:
print(f"set : {set_time}")
print(f"regex : {regex_time}")
print(f"translate: {translate_time}")
set : 2.3104199539998262
regex : 0.9609262190001573
translate: 0.8181181009999818
Conclusion: either regex or translate is fine, with translate being slightly faster.
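One caveat worth noting: string.punctuation covers ASCII punctuation only, so non-ASCII punctuation such as curly quotes survives all three approaches. A small illustration:

```python
import string

s = "don’t stop"  # U+2019 curly apostrophe, not in string.punctuation
table = str.maketrans("", "", string.punctuation)
print(s.translate(table))  # -> don’t stop (unchanged)
```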