#!/usr/bin/env python
# coding: utf-8
# In[2]:
# Earlier version of process_doubles, kept for reference. It only handles
# "डबल" as a separate token and does not split a glued "डबल<word>" first.
# # Function to process "double" followed by a number
# def process_doubles(sentence):
#     tokens = sentence.split()
#     result = []
#     i = 0
#     while i < len(tokens):
#         if tokens[i] == "डबल":
#             if i + 1 < len(tokens):
#                 result.append(tokens[i + 1])
#                 result.append(tokens[i + 1])
#                 i += 2
#             else:
#                 result.append(tokens[i])
#                 i += 1
#         else:
#             result.append(tokens[i])
#             i += 1
#     return ' '.join(result)
# In[ ]:
import re | |
# Matches a word-initial "डबल" that is glued to the following word
# (e.g. "डबलवन").  The lookbehind keeps a "डबल" embedded inside a longer
# word from being split, and the lookahead refuses to split directly in
# front of a Devanagari dependent sign (vowel sign, nukta, virama,
# anusvara, ...), which would otherwise leave an orphaned combining mark
# as its own token (e.g. "डबलिंग" must stay one word).
_GLUED_DOUBLE_RE = re.compile(
    r'(?<!\S)डबल'
    r'(?=[^\s\u0900-\u0903\u093a-\u093c\u093e-\u094f\u0951-\u0957\u0962\u0963])'
)


def process_doubles(sentence):
    """Expand every "डबल X" in *sentence* into "X X".

    A "डबल" glued to the front of the next word ("डबलवन") is first
    separated into two tokens ("डबल वन").  Then each stand-alone "डबल"
    token is dropped and the token that follows it is emitted twice.

    Args:
        sentence: Whitespace-separated text to normalise.

    Returns:
        The rewritten sentence with tokens joined by single spaces.
        A trailing "डबल" with nothing after it is kept unchanged, and an
        empty or whitespace-only input yields an empty string.
    """
    sentence = _GLUED_DOUBLE_RE.sub('डबल ', sentence)

    # A shared iterator lets the "डबल" branch consume the following token,
    # so that token is not visited a second time by the for-loop.
    tokens = iter(sentence.split())
    result = []
    for token in tokens:
        if token != "डबल":
            result.append(token)
            continue
        # str.split() never yields None, so it is a safe "no more tokens"
        # sentinel here.
        following = next(tokens, None)
        if following is None:
            # Nothing left to duplicate: keep the dangling "डबल" as-is.
            result.append(token)
        else:
            result.extend((following, following))
    return ' '.join(result)