mbuali
/

Llama-3.1-8B-DALv0.1

Text Generation

Model card Files Files and versions Community

Llama-3.1-8B-DALv0.1 / venv /lib /python3.12 /site-packages /mistune /plugins /speedup.py

mbuali's picture

Upload folder using huggingface_hub

d1ceb73 verified 11 months ago

history blame contribute delete

1.07 kB

	import re
	import string

	# Because handling a mismatch is too slow, add dedicated parsers for paragraph and text.

	# Any run of spaces before a newline together with all whitespace after it.
	# parse_text replaces each match with a single '\n', so the quantifiers are
	# required: without them only "one space, newline, one whitespace char"
	# would be normalised.
	HARD_LINEBREAK_RE = re.compile(r' *\n\s*')
	PARAGRAPH = (
	    # One or more consecutive lines whose first character is not
	    # punctuation, not a digit and not whitespace.
	    r'(?:^[^\s\d' + re.escape(string.punctuation) + r'][^\n]*\n)+'
	)

	# Names exported by a star-import of this module: only ``speedup``.
	__all__ = ['speedup']



	def parse_text(inline, m, state):
	    """Process one matched run of inline text.

	    Every match of ``HARD_LINEBREAK_RE`` inside the matched text is
	    replaced with a single newline, and the result is passed to
	    ``inline.process_text`` together with ``state``.

	    :param inline: object providing ``process_text(text, state)``.
	    :param m: regex match object for the text run.
	    :param state: passed through unchanged to ``inline.process_text``.
	    :returns: ``m.end()``, the offset just past the matched text.
	    """
	    normalized = HARD_LINEBREAK_RE.sub('\n', m.group(0))
	    inline.process_text(normalized, state)
	    return m.end()


	def parse_paragraph(block, m, state):
	    """Record the matched text as a paragraph.

	    :param block: accepted as part of the callback signature; not used here.
	    :param m: regex match object whose full match is the paragraph text.
	    :param state: object providing ``add_paragraph(text)``.
	    :returns: ``m.end()``, the offset just past the matched paragraph.
	    """
	    state.add_paragraph(m.group(0))
	    return m.end()


	def speedup(md):
	    """Increase the speed of parsing paragraph and inline text.

	    Registers a ``paragraph`` rule on ``md.block`` and a ``text`` rule on
	    ``md.inline``.  The text rule lazily consumes characters up to (but not
	    including) the first position where one of the lookahead alternatives
	    matches:

	    * one of the characters listed in ``punc``;
	    * ``https?:`` -- only when ``'url_link'`` is in ``md.inline.rules``;
	    * ``' *\\n'`` when ``md.inline.hard_wrap`` is truthy, otherwise
	      ``' {2,}\\n'``;
	    * the end of the input.

	    :param md: object exposing ``block.register``, ``inline.register``,
	        ``inline.rules`` and ``inline.hard_wrap``.
	    """
	    md.block.register('paragraph', PARAGRAPH, parse_paragraph)

	    # Plain text must stop before any of these characters (presumably the
	    # ones that can open inline markup -- confirm against the inline rules).
	    punc = r'\\><!\[_*`~\^\$='

	    # Collect the lookahead alternatives and join them with a real ``|``.
	    # An escaped ``\|`` would match a literal pipe character instead of
	    # acting as alternation, so the rule would almost never stop.
	    stops = ['[' + punc + ']']
	    if 'url_link' in md.inline.rules:
	        stops.append(r'https?:')

	    if md.inline.hard_wrap:
	        stops.append(r' *\n')
	    else:
	        stops.append(r' {2,}\n')

	    stops.append(r'$')
	    text_pattern = r'[\s\S]+?(?=' + '|'.join(stops) + r')'
	    md.inline.register('text', text_pattern, parse_text)