diff --git a/packages/text-to-speech/src/htmlToSsml.ts b/packages/text-to-speech/src/htmlToSsml.ts
index 7eb1e1924..9999e9f24 100644
--- a/packages/text-to-speech/src/htmlToSsml.ts
+++ b/packages/text-to-speech/src/htmlToSsml.ts
@@ -273,7 +273,7 @@ const textToUtterance = ({
voice?: string
isHtml?: boolean
}): Utterance => {
- const text = textItems.join('')
+ const text = stripEmojis(textItems.join(''))
let textWithWordOffset = text
if (isHtml) {
try {