
Retrieval 101

A practical guide to implementing semantic search for technical content

The Challenge of Finding Relevant Content

Have you ever spent hours writing a blog post only to have it disappear into the void? You're not alone. I spend a lot of time making detailed tutorials, explanations, and code examples, yet much of this content is hard to find.

Roughly 90% of users never venture past the first page of search results, and most scan only the top 3-5 entries before reformulating their query or abandoning the search altogether. For technical blogs, this problem is even more acute - the specialized vocabulary and conceptual relationships between topics make keyword matching particularly ineffective.

Search solutions that rely solely on exact word matches will often have huge misses. For example, my post about custom tags for FastHTML may be highly relevant to someone looking to use web components, yet "web components" is a term never mentioned directly in the blog post!

This disconnect creates a frustrating experience for both content creators and consumers. Content creators have to spend time trying to jam in keywords to make things more discoverable, and readers struggle to find the solutions they're looking for.

The question becomes: how can we make technical content discoverable by meaning rather than just keywords?

What This Post Will Deliver

In this tutorial, you'll learn how to implement a semantic search system using LanceDB. Instead of relying on exact keyword matches, you'll be able to find content based on meaning and conceptual relationships. We will go beyond the hello-world of vector search: we'll combine vector search with keyword search in a hybrid approach, then re-rank the final results with a cross-encoder. By the end of this tutorial, you'll know what all of that means and how to implement it.

By the end of this post, you'll have a complete solution that can:

  • Find conceptually related blog posts even when they use different terminology
  • Surface relevant technical content based on the intent behind a search query
  • Provide more accurate and helpful search results to your readers

Here's a quick preview of what we'll build:

# A simple semantic search query that finds related content
query = "How do I make web components?"

results = blog_search.search(query, limit=3)

for result in results:
    print(f"Post: {result.metadata['title']}")
    print(f"Relevance score: {result.score:.2f}")

# Output:
# Post: Creating Custom FastHTML Tags for Markdown Rendering
# Relevance score: 0.87
#
# Post: Python Programming Tips
# Relevance score: 0.72

This isn't just theory - you'll implement this system step-by-step using real blog posts, and I'll show you how to adapt it to your own content. Whether you have a personal tech blog, manage documentation for a larger project, or have anything else you want people to be able to search, this approach will help your valuable content reach the right audience.

This is the foundation of a modern retrieval system, and I am hard-pressed to think of an example where you want good semantic search but would not want this as the foundation.

💡 Check out the companion repo for runnable code examples

Vector Embeddings: The Key to Semantic Search

At the heart of semantic search is the concept of vector embeddings. AI models cannot understand words directly, so we have to convert everything to numbers to compare them programmatically. Let's take a simple example: suppose we give four words vector embeddings

  • Cat = [1.5, 2.5, 2.2]
  • Dog = [1.8, 2.6, 2.6]
  • Animal = [1.6, 2.4, 2.4]
  • Bog = [0.1, 0.3, 5.9]

You can see, using just the numbers, that Cat and Dog are more similar to Animal than they are to Bog. What does each specific number mean? I don't know - they don't map to human language! Similar concepts end up close to each other in this space, even if they use different words. That's what powers semantic search.
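
To make this concrete, here's a minimal sketch that scores the toy vectors above with cosine similarity, the same comparison we'll lean on later when searching:

import numpy as np

def cosine_similarity(a, b):
    # Cosine similarity: close to 1.0 means pointing in the same direction
    a, b = np.array(a), np.array(b)
    return np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b))

cat, dog, animal, bog = [1.5, 2.5, 2.2], [1.8, 2.6, 2.6], [1.6, 2.4, 2.4], [0.1, 0.3, 5.9]
print(f"cat vs animal: {cosine_similarity(cat, animal):.2f}")  # ~1.0, very similar
print(f"dog vs animal: {cosine_similarity(dog, animal):.2f}")  # ~1.0, very similar
print(f"cat vs bog:    {cosine_similarity(cat, bog):.2f}")     # noticeably lower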

In a more targeted example, the phrases "how to test Python code" and "writing unit tests for Python functions" might use different words, but their vector embeddings would be very similar because they represent the same concept.

This leads to the question: "How do you pick the numbers for each word, sentence, or article?".

Modern language models like BERT, GPT, and their derivatives can generate these embeddings by processing vast amounts of text and learning the relationships between words and concepts. We can leverage those pre-existing models to generate these embeddings (training a new model to do this is out of the scope of this tutorial).

Initial Solution Attempt: Setting Up LanceDB

First, let's pull in four sample posts (clean_post and read_url are small helpers that fetch and clean each post):

fh_tutorial = clean_post(read_url('https://isaac.up.railway.app/blog/blog_post?fpath=posts%2FFasthtmlTutorial.ipynb'))
ms_scratch = clean_post(read_url('https://isaac.up.railway.app/blog/blog_post?fpath=posts%2FMeanShiftFromScratch.ipynb'))
py_tips = clean_post(read_url('https://isaac.up.railway.app/blog/blog_post?fpath=posts%2FPython.ipynb'))
bas_test = clean_post(read_url('https://isaac.up.railway.app/blog/blog_post?fpath=posts%2FBasicTesting.ipynb'))

We'll prepare our blog posts. For simplicity, we'll extract titles and content from our sample posts:

Credit: This post was inspired by Ben Clavié's excellent work on semantic search implementations. His conference talk on RAG systems provided many of the core concepts and techniques explored in this tutorial. I highly recommend checking out his original presentation for additional context and perspectives. You will be glad you did - it is well worth the time.

import pandas as pd
from sentence_transformers import SentenceTransformer
import lancedb
posts = [fh_tutorial, ms_scratch, py_tips, bas_test]
blog_data = [{'title': post.split('\n')[0].replace('# ', ''), 'content': post} for post in posts]
df = pd.DataFrame(blog_data)
df
                                               title                                            content
0  Creating Custom FastHTML Tags for Markdown Ren...  # Creating Custom FastHTML Tags for Markdown R...
1                             MeanShift From Scratch  # MeanShift From Scratch\n\nA deep dive on mea...
2                            Python Programming Tips  # Python Programming Tips\n\nA list of handy t...
3               Introduction To Statistical Testing  # Introduction To Statistical Testing\n\nAn in...

The next thing we need is a vector embedding for each post. As mentioned before, we can use a pretrained model for this.

model = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")

💡 One place to look for embedding models is the MTEB Leaderboard (see the BEIR retrieval benchmark). Though be careful: many of the models are overfit to the leaderboard.
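
As a quick sanity check of the earlier claim about paraphrases, here's a minimal sketch comparing the two testing phrases from before. Because the embeddings are normalized, a plain dot product is their cosine similarity:

a = model.encode("how to test Python code", normalize_embeddings=True)
b = model.encode("writing unit tests for Python functions", normalize_embeddings=True)
c = model.encode("how to bake sourdough bread", normalize_embeddings=True)
print(float(a @ b))  # high - same concept, different words
print(float(a @ c))  # much lower - unrelated concept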

df['vector'] = df['content'].apply(lambda x: model.encode(x, normalize_embeddings=True))
df.head()
                                               title                                            content                                             vector
0  Creating Custom FastHTML Tags for Markdown Ren...  # Creating Custom FastHTML Tags for Markdown R...  [-0.0600754, 0.07570859, 0.0017243278, 0.00696...
1                             MeanShift From Scratch  # MeanShift From Scratch\n\nA deep dive on mea...  [0.022285162, -0.03508064, -0.006767927, -0.04...
2                            Python Programming Tips  # Python Programming Tips\n\nA list of handy t...  [-0.017614271, -0.015829531, -0.044863362, 0.0...
3               Introduction To Statistical Testing  # Introduction To Statistical Testing\n\nAn in...  [-0.0035132996, -0.026535656, -0.10052579, 0.0...

We can load all of that into our vector database, LanceDB.

db = lancedb.connect("./lancedb-tutorial")
table = db.create_table("blog_posts", data=df, mode="overwrite")

Now, we're ready to use LanceDB to search. There are three main steps:

1. Create an embedding of your query or question

query = "How do I make web components?" # Get a query
query_embedding = model.encode(query) # Create an embedding of it
query_embedding.shape, query_embedding[:3] # 384 numbers representing the query

((384,), array([-0.01018321, -0.05370776, -0.08562952], dtype=float32))

2. Compare Similarity

Now we can search the table to find most similar embeddings

results = table.search(query_embedding).metric('cosine').to_pandas()
results['_distance']

0    0.585938
1    0.810537
2    0.951037
3    0.976564
Name: _distance, dtype: float32

💡 Different models use different distance metrics. This model was trained with cosine similarity per the Hugging Face model card, so I matched that.
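
If you're curious what `_distance` actually is: with the cosine metric, LanceDB reports 1 minus the cosine similarity, which we can reproduce by hand. A minimal sketch (row 0 of df is the FastHTML post, the top hit above):

import numpy as np

q = query_embedding / np.linalg.norm(query_embedding)  # normalize the query vector
d = df['vector'][0]                                    # post vectors were stored normalized
print(1 - float(np.dot(q, d)))                         # ~0.586, matching the distance above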

3. See Results

Now we can see which post is the most similar to the query based on those embeddings

for _, row in results.iterrows():
    print(f"Post: {row['title']}")
    print(f"Distance: {row['_distance']:.2f}")
Post: Creating Custom FastHTML Tags for Markdown Rendering
Distance: 0.59
Post: Python Programming Tips
Distance: 0.81
Post: Introduction To Statistical Testing
Distance: 0.95
Post: MeanShift From Scratch
Distance: 0.98
We can also verify that the phrase "web component" truly never appears in the retrieved post:

assert 'web component' not in fh_tutorial.lower()

This basic implementation allows us to search our blog posts semantically. When we run a query like "How do I make web components?", it finds the relevant post even though web components are never mentioned directly in the tutorial.

However, this approach has a lot of limitations.

Why the Initial Approach Isn't Enough

Our simple semantic search implementation works, but it has several limitations that make it inadequate for serious technical content:

  1. Full document embeddings lose detail: When we embed entire blog posts, we're compressing thousands of words into a single 384-dimensional vector. This means specific technical details get lost.

  2. Code blocks get mixed with text: Technical blogs contain a mix of explanatory text and code examples. Our current approach treats both the same way, diluting the search quality.

  3. No re-ranking: We're using a simple bi-encoder approach with cosine similarity, but as Ben Clavié explains, this misses the nuance that cross-encoders can provide.

Chunking

To address the limitations of our initial approach, we need to implement a more sophisticated solution. Following Ben Clavié's recommendations, we'll improve our system by:

  1. Chunking our documents by markdown sections
  2. Adding keyword search capabilities (BM25)
  3. Implementing a re-ranking step

Let's start with the chunking strategy, which will help us preserve more context and detail:

There are a plethora of chunking strategies you can test, but let's start with the most obvious one: use the chunks already defined by the author of the article, and split on markdown headers.

Note: There's lots of discussion about optimal chunk length, overlap, and different ways to split. I recommend starting with what makes sense, and then trying out alternatives.

def chunk_by_markdown_sections(markdown_text, min_length=250):
    """Split markdown text into chunks based on header sections."""
    lines = markdown_text.split('\n')
    chunks = []
    current_chunk = []
    current_title = "Introduction"
    
    for line in lines:
        if line.startswith('#'):  # New header found
            # Save previous chunk if it's substantial
            if current_chunk and len('\n'.join(current_chunk)) >= min_length:
                chunks.append({'title': current_title, 'content': '\n'.join(current_chunk)})
            
            # Start new chunk
            current_title = line.lstrip('# ')
            current_chunk = [line]
        else:
            current_chunk.append(line)
    
    # Add the final chunk if it exists and meets length requirement
    if current_chunk and len('\n'.join(current_chunk)) >= min_length:
        chunks.append({'title': current_title, 'content': '\n'.join(current_chunk)})
    
    return chunks
chunk_by_markdown_sections("""# Markdown\n# Chunked\n## Based on markdown\n## Headers for RAG""", min_length=1)

[{'title': 'Markdown', 'content': '# Markdown'}, {'title': 'Chunked', 'content': '# Chunked'}, {'title': 'Based on markdown', 'content': '## Based on markdown'}, {'title': 'Headers for RAG', 'content': '## Headers for RAG'}]
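
For contrast, a fixed-size chunker with overlap is another common strategy you might test. Here's a minimal sketch (illustrative only - we'll stick with the markdown-section chunks for the rest of this post):

def chunk_by_size(text, chunk_size=1000, overlap=200):
    # Naive fixed-size chunking with character overlap between neighboring chunks
    chunks, start = [], 0
    while start < len(text):
        chunks.append(text[start:start + chunk_size])
        start += chunk_size - overlap
    return chunks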

Now let's apply this chunking function to our blog posts:

all_chunks = []
for i, row in df.iterrows():
    for chunk in chunk_by_markdown_sections(row['content']):
        all_chunks.append({
            'post_title': row['title'], 
            'chunk_title': chunk['title'],
            'content': chunk['content'],
            'vector': model.encode(chunk['content'], normalize_embeddings=True)})

# Create DataFrame with all chunks
chunks_df = pd.DataFrame(all_chunks)

The most important thing to learn from this entire guide is that when you do things, you should look at your data. Don't assume things were right. Don't assume your idea made sense. Print it out and look!

for i,r in chunks_df.iterrows():
    print(r.content)
    print("-----\n")
    if i==2: break
# Intro

This post will cover how to render markdown using zero-md in FastHTML in a practical example. This includes:

  * Defining a custom HTML tag in FastHTML
  * Using external CSS and javascript libraries with FastHTML
  * Adding CSS styling
  * Organize UI into columns

In this tutorial we will convert a markdown of an early lesson in the boot.dev curriculum and a fake conversation between a student and a chatbot about the lesson to HTML. Boot.dev is an online learning platform that offers self-paced, gamified courses for back-end web development.

-----

# Markdown With Zero-md

[code]

    # Import style 1 
    from fasthtml.common import *
    from functools import partial
    
    # Import style 2
    from fasthtml.core import P, Script, Html, Link, Div, Template, Style, to_xml
    from fasthtml.components import show
[/code]

In FastHTML we can use the `P` function to put text in a paragraph `<p></p>` tag (a common way of displaying text). However, markdown is not rendered properly and is hard to read!

While text can be read without styling, markdown has headers, code, bullets and other elements. So we need something more than just a regular text rendering.

We need to convert markdown formatting into a format that HTML understands. We can use a javascript library called zero-md to do this, but this tag does not have a function in FastHTML. There are still two options for using this tag in FastHTML.

> ### 💡 What is zero-md?
>
> In web development, HTML defines the general structure of a web page. However, HTML alone is usually not sufficient. Javascript allows us to extend what we can do beyond out-of-the-box HTML. `zero-md` is a Javascript library that adds functionality for displaying markdown content that we can use with an HTML tag.

The first option is to write the HTML in a text string and use that.

[code]

    NotStr(f'''<zero-md><script type="text/markdown">{lesson_content}</script></zero-md>''')
    
[/code]

> ### 💡 Tip
>
> `NotStr` is a FastHTML function designed for passing a string that should be executed as HTML code rather than a string. In the example above, because `NotStr` is used, FastHTML will treat it as HTML code rather than a Python string. If we removed the `NotStr`, all the HTML tags would be displayed on the page just as they are written rather than being rendered nicely for your web application.

This is fine for very simple things, but the more you build, the messier and harder it gets to work with. It is better to create a FastHTML style tag that works just like everything else. It's incredibly simple to create a custom tag. By importing from `fasthtml.components` the HTML tag will be created automatically (defined in the module's `__getattr__`).

[code]

    from fasthtml.components import Zero_md
[/code]

Now that we have our custom tag defined, we can use that with the `<script>` tag (included in FastHTML) to apply the formatting per the zero-md documentation. For now, we will use the defaults and do nothing with CSS (more details on this later).

[code]

    def render_local_md(md, css = ''):
        css_template = Template(Style(css), data_append=True)
        return Zero_md(css_template, Script(md, type="text/markdown"))
    
    lesson_content_html = render_local_md(lesson_content)
    print(to_xml(lesson_content_html))
[/code]

[code]

    <zero-md><template data-append>    <style></style>
    </template><script type="text/markdown"># Startup bug
    
    A new startup has a bug in its server code. The code is supposed to print messages indicating the server has started successfully.
    
    ## Challenge
    
    Fix the 2 errors in the code and get it to run!
    
    ```python
    print(&quot;Starting up server...&#x27;)
    prnt(&quot;local server is listening on port 8080&quot;)
    ```</script></zero-md>
    
[/code]

The last thing we need to do is load zero-md from a CDN. We can do this by adding a `<script>` tag to the `<head>` of the HTML, and it all works!

[code]

    with open('static/_readme.md') as f: lesson_content = f.read()
    
    zeromd_headers = [Script(type="module", src="https://cdn.jsdelivr.net/npm/zero-md@3?register")]
[/code]

`Html(*zeromd_headers, lesson_content_html)`

-----

# Markdown Conversation Bubbles

We will start with default DaisyUI chat bubbles. For many types of conversations this is fine, but for this use case we need markdown to render properly for code snippets and structural elements.

> ### 💡 Note
>
> This part of the tutorial picks up where the step-by-step DaisyUI example in the FastHTML documentation leaves off. For more information, start there!
[code]

    #loading messages
    import json
    with open('static/conversation.json') as f:
        messages = json.load(f)['messages']
[/code]

[code]

    # Loading tailwind and daisyui
    chat_headers = [Script(src="https://cdn.tailwindcss.com"),
               Link(rel="stylesheet", href="https://cdn.jsdelivr.net/npm/daisyui@4.11.1/dist/full.min.css")]
[/code]

We re-use the code from the daisyUI example with one change. We are using the `render_local_md` function we defined.

[code]

    # Functionality identical to Daisy UI example linked above
    def ChatMessage(msg, render_md_fn=lambda x: x):
        md = render_md_fn(msg['content'])
        return Div(
            Div(msg['role'], cls="chat-header"),
            Div(md, cls=f"chat-bubble chat-bubble-{'primary' if msg['role'] == 'user' else 'secondary'}"),
            cls=f"chat chat-{'end' if msg['role'] == 'user' else 'start'}")
[/code]

Using this, markdown doesn't render properly, causing readability issues.

Instead let's do exactly what we did before with Zero-md. Our markdown renders, however there are some issues with css styles clashing.

[code]

    chat_bubble =Html(*(chat_headers+zeromd_headers), ChatMessage(messages[1], render_md_fn=render_local_md))
[/code]

We can inject CSS styling to handle this issue by telling zero-md to use a template and ignore the default styles to make beautiful properly rendered conversations.

> ### 💡 Tip
>
> CSS allows us to extend what we can do with just HTML by providing a syntax for adding styling to HTML elements in a programmatic way. You may want every header to have a specific text color or every paragraph to have a specific background color. CSS allows us to do that.
[code]

    css = '.markdown-body {background-color: unset !important; color: unset !important;}'
    _render_local_md = partial(render_local_md, css=css)
    chat_bubble = Html(*(chat_headers+zeromd_headers), ChatMessage(messages[1], render_md_fn=_render_local_md))
[/code]

Now that it looks good we can apply this style to all messages

-----

Now we can create a new LanceDB table with our chunked content:

chunk_table = db.create_table("blog_chunks", data=chunks_df, mode="overwrite")

We can then query to find the most relevant chunks instead of entire documents.

results = chunk_table.search(query_embedding).metric('cosine').to_pandas()

# Print the top 3 results
for i, (_, row) in enumerate(results.iterrows()):
    print(f"Distance: {row['_distance']:.2f}")
    print(f"Post: {row['post_title']} : {row['chunk_title']}")
    print('---')
    if i == 2: break
Distance: 0.63
Post: Creating Custom FastHTML Tags for Markdown Rendering : Intro
---
Distance: 0.64
Post: Creating Custom FastHTML Tags for Markdown Rendering : Putting it Together
---
Distance: 0.66
Post: Creating Custom FastHTML Tags for Markdown Rendering : Markdown With Zero-md
---

This chunking approach gives us several advantages:

  1. Each vector now represents a more focused piece of content
  2. We preserve the hierarchical structure of the document
  3. We can return specific sections rather than entire posts
  4. We stay within the token limits of our embedding model
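
That last point is worth verifying rather than assuming - chunks longer than the model's limit get truncated silently. A quick sketch using the tokenizer attached to our sentence-transformers model:

token_counts = [len(model.tokenizer.encode(c)) for c in chunks_df['content']]
print(f"longest chunk: {max(token_counts)} tokens")
print(f"model limit:   {model.max_seq_length} tokens")  # 256 for all-MiniLM-L6-v2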

In the next section, we'll enhance our retrieval system by implementing a hybrid search approach that combines vector similarity with keyword matching for more accurate results.

Hybrid Search

Now that we've improved our system with chunking, let's implement the next key improvements from Ben Clavié's recommendations:

  1. Adding keyword search (BM25) alongside vector search
  2. Implementing a re-ranking step

Let's start with implementing keyword search to complement our vector search:

import bm25s

BM25 is a powerful keyword-based search algorithm that works by analyzing term frequency and document length. We'll use it to complement our vector search by capturing exact keyword matches that semantic search might miss.
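
Before wiring BM25 into our search function, here's a minimal standalone sketch of the bm25s workflow on a toy corpus. When no corpus is attached to the index, retrieve returns row indices rather than documents:

toy_corpus = ["testing python code", "fasthtml custom tags", "meanshift clustering"]
retriever = bm25s.BM25()
retriever.index(bm25s.tokenize(toy_corpus))

idxs, scores = retriever.retrieve(bm25s.tokenize("python testing"), k=2)
print(idxs[0], scores[0])  # the "testing python code" doc should rank first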

def hybrid_search(query, top_k=5, vector_weight=0.7):
    """Perform hybrid search using both vector similarity and BM25 keyword matching."""
    # Vector search
    query_embedding = model.encode(query, normalize_embeddings=True)
    vector_results = chunk_table.search(query_embedding).metric('cosine').limit(top_k*2).to_pandas()
    vector_results['vector_score'] = 1 - vector_results['_distance']
    
    # Keyword search with bm25s (for simplicity we rebuild the index per query;
    # in production you would build it once up front)
    corpus = chunks_df['content'].tolist()
    retriever = bm25s.BM25()
    retriever.index(bm25s.tokenize(corpus))
    
    # Score every chunk, then key the scores by chunk text so we can join them
    # onto the vector results (LanceDB results don't carry our dataframe index)
    idxs, scores = retriever.retrieve(bm25s.tokenize(query), k=len(corpus))
    bm25_scores = {corpus[int(i)]: float(scores[0, rank]) for rank, i in enumerate(idxs[0])}
    vector_results['bm25_score'] = vector_results['content'].map(lambda c: bm25_scores.get(c, 0.0))
    
    # Normalize BM25 scores to [0, 1] so they're comparable to cosine similarity
    if vector_results['bm25_score'].max() > 0:
        vector_results['bm25_score'] = vector_results['bm25_score'] / vector_results['bm25_score'].max()
    
    # Combine scores with weighting
    vector_results['combined_score'] = (
        vector_weight * vector_results['vector_score'] + 
        (1 - vector_weight) * vector_results['bm25_score'])
    
    return vector_results.sort_values('combined_score', ascending=False).head(top_k)
query = "How do I make web components?"
results = hybrid_search(query, 6)

for i, (_, row) in enumerate(results.iterrows()):
    print(f"Post: {row['post_title']}")
    print(f"Section: {row['chunk_title']}")
    print(f"Relevance: {row['combined_score']:.2f}")
    print("---")
    if i == 2: break

Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Intro
Relevance: 0.26
---
Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Putting it Together
Relevance: 0.25
---
Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Markdown With Zero-md
Relevance: 0.24
---

Re-ranking

So far, with vector search, a model takes in a piece of text and produces a fixed vector representation of it. This is really fast in practice because the vectors for all the documents you want to search against can be pre-calculated: a document's vector doesn't change regardless of the user query, so we computed them up front and stored them in LanceDB.

However, a cross-encoder can judge relevance more accurately. Instead of embedding the query and document separately, it examines each query-document pair together in context, which helps it capture nuanced relationships that the initial retrieval step might miss. For example, it can better understand when a document answers a question even if it uses different terminology.

The process works in two stages:

  1. We use our hybrid search (vector + BM25) to efficiently retrieve a set of candidate chunks
  2. We then apply the more computationally expensive cross-encoder to re-rank these candidates

This approach gives us the best of both worlds - the efficiency of bi-encoders for initial retrieval and the accuracy of cross-encoders for final ranking.
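
Conceptually, a cross-encoder call is just scoring (query, document) pairs. A minimal sketch using sentence-transformers' CrossEncoder with a small MS MARCO reranker (below we'll use the rerankers library instead, which wraps this same idea):

from sentence_transformers import CrossEncoder

ce = CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')
pairs = [(query, doc) for doc in chunks_df['content'].head(3)]
print(ce.predict(pairs))  # one relevance score per (query, document) pair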

from rerankers import Reranker
ranker = Reranker('cross-encoder', model='mixedbread-ai/mxbai-rerank-base-v1', verbose=False)

Loading default cross-encoder model for language en
Warning: Model type could not be auto-mapped with the defaults list. Defaulting to TransformerRanker.
If your model is NOT intended to be ran as a one-label cross-encoder, please reload it and specify the model_type! Otherwise, you may ignore this warning. You may specify `model_type='cross-encoder'` to suppress this warning in the future.

💡 A good safe bet (today) is the Cohere Rerank API. I'm not using it for this blog post because it requires an API key and it's not necessary for this intro tutorial, but it's something you should look into!

def search_blog_posts(query, top_k=3):
    "Search blog posts using hybrid search followed by cross-encoder reranking"
    # Get candidates with hybrid search
    candidates = hybrid_search(query, top_k=top_k*2)
    
    # Rerank candidates
    texts = candidates['content'].tolist()
    doc_ids = candidates.index.tolist()
    ranked = ranker.rank(query=query, docs=texts, doc_ids=doc_ids)
    
    # Map scores back to candidates and return top results
    candidates['rerank_score'] = candidates.index.map(
        {r.document.doc_id: r.score for r in ranked.results}.get)
    return candidates.sort_values('rerank_score', ascending=False).head(top_k)
query = "How do I make web components?"
results = search_blog_posts(query)

for _, row in results.iterrows():
    print(f"Post: {row['post_title']}")
    print(f"Section: {row['chunk_title']}")
    print(f"Relevance: {row['rerank_score']:.2f}")
    print("---")
Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Putting it Together
Relevance: 0.01
---
Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Markdown With Zero-md
Relevance: -1.34
---
Post: Creating Custom FastHTML Tags for Markdown Rendering
Section: Markdown Conversation Bubbles
Relevance: -2.31
---

While our hybrid search with re-ranking is already a significant improvement, there are still lots of improvements that can be made.

Key Takeaways and Principles

  1. Semantic search isn't magic - It's about transforming text into numbers that capture meaning. These numerical representations are flawed and cannot be relied on exclusively for every type of query.

  2. Domain Knowledge is king - Understanding your specific domain and content type allows you to make intelligent decisions. Be a user of your own system: actually run queries and read the responses. Do this A LOT. It allows you to start with a simple approach, identify limitations, and systematically address them with targeted improvements.

  3. Hybrid approaches outperform single methods - There is no magic answer that fixes all problems. A combination of vector search, keyword matching, and re-ranking provides significantly better results than any single approach alone. But this is just the basics, and there are many more things to add based on your use-case.

  4. Chunking matters - How you divide your content has a huge impact on retrieval quality and user experience. The chunks should be meaningful units that preserve context while remaining focused enough to be useful. After chunking, look at them to see if they make sense!

  5. The bi-encoder/cross-encoder pattern is widely applicable - The pattern of using a fast but less accurate method for initial retrieval, followed by a slower but more accurate method for refinement, is super powerful.

  6. Evaluation is essential - Though we didn't cover it in this tutorial, having a way to measure search quality is critical for ongoing improvement. What gets measured can be improved.

Next Steps

If you've followed along to this point, you now have a powerful semantic search system for your blog posts. But there's massive room for growth and experimentation:

💡 Check out the companion repo to start experimenting!

Extend Your Implementation

  • Add Metadata Filtering: Enable users to narrow results by programming language, difficulty level, or post type (e.g., "Show me only Python tutorials for beginners"). A minimal sketch follows this list.

  • Add Multi-Modal Search: Incorporate images, diagrams, and code snippets in your search index to find visual explanations alongside text (e.g., "Find me posts with architecture diagrams for microservices").

  • Add Evaluation Framework: Build a systematic way to measure search quality with metrics like precision and recall to continuously improve your system. Create implicit evaluation (link tracking) or user feedback systems.

  • Add Query Pre-processing: Identify and prioritize technical terms and entities in user queries to better match domain-specific content (e.g., recognizing "React hooks" as a specific technical concept).

  • Add Query Classification: Detect the intent behind searches to provide more tailored results (e.g., distinguishing between "how to" tutorials vs conceptual explanations).

  • Add Query Expansion: Automatically add related technical terms to queries to improve recall (e.g., expanding "web components" to include "custom elements" and "shadow DOM").

  • Experiment with different chunking strategies: Test different chunking strategies and sizes to find the optimal balance between context preservation and specificity for your content.

  • "More Like This" Functionality: Allow users to find similar content to a post they're already reading, creating a natural exploration path through your technical content.

Join the Conversation

I'd love to hear about your experiences implementing semantic search:

  • What chunking strategies worked best for your content?
  • Which embedding models performed best in your domain?
  • What unexpected challenges did you encounter?

Share your implementation, ask questions, or suggest improvements in the comments below or reach out on Twitter/X @isaac_flath.

Remember, the field of semantic search and retrieval is evolving rapidly. The techniques we've covered provide a solid foundation, but staying curious and experimental will keep your system at the cutting edge.
