KiwiSpeed - Python scripts that chart how fast a thread moves

Jason "Thor" Hall / PirateSoftware / Maldavius Figtree
StdMald.webp

Francis Joseph Benditt IV / FallenChungus / datsmojo
StdFallenChungus.webp

Alex Hogendorp / Lunar Eclipse Paradox
StdHogendorp.webp

Troonslop "Retro" Games
StdTroonslop.webp

Elon Reeve Musk
StdElon.webp

Introducing KiwiSpeed, a pair of Python scripts that scrape a thread and chart how fast it has been moving. KiwiSpeedScraper.py steps through every page of a thread, collects the timestamp of every post, and saves them to a CSV file. KiwiSpeedChart.py reads that CSV and makes the PyPlot chart you see above.
Python:
# KIWISPEED SCRAPER
# Created by: my penis is on fire

import requests
from html.parser import HTMLParser
from datetime import datetime
import csv

## SETTINGS ##
thread_url = "https://kiwifarms.st/threads/elon-reeve-musk.134949/" # URL of Page 1 of thread to capture
pages = 694 # Number of pages this thread has
filename = "elonmusk.csv" # Name of output file (Must end in .csv)



class TimestampParser(HTMLParser):
    
    def __init__(self):
        super().__init__()
        self.timestamps = []
        self._in_lastedit = False
        self._in_embed = False
        self._embed_depth = 0

    def handle_starttag(self, tag, attrs):
        tag = tag.lower()
        attr_dict = {name.lower(): val for name, val in attrs}

        # Entering "last edited" block?
        if tag == 'div' and 'class' in attr_dict and 'message-lastEdit' in attr_dict['class']:
            self._in_lastedit = True
            return

        # Entering an embed block?
        if tag == 'div' and 'class' in attr_dict and 'fauxBlockLink' in attr_dict['class']:
            self._in_embed = True
            self._embed_depth = 1
            return

        # If already inside an embed, track nested divs
        if self._in_embed and tag == 'div':
            self._embed_depth += 1
            return

        # Parse <time> if not in an edit or embed
        if tag == 'time' and not self._in_lastedit and not self._in_embed:
            ts = None
            if 'title' in attr_dict:
                ts = attr_dict['title'].replace(',', '')
            # Parse ISO datetime and reformat for csv
            elif 'datetime' in attr_dict:
                iso = attr_dict['datetime']
                try:
                    dt = datetime.fromisoformat(iso)
                    ts = dt.strftime('%b %d %Y at %I:%M %p').replace(' 0', ' ')
                except ValueError:
                    ts = iso
            if ts:
                self.timestamps.append(ts)

    def handle_endtag(self, tag):
        tag = tag.lower()
        # Exiting embed blocks?
        if tag == 'div' and self._in_embed:
            self._embed_depth -= 1
            if self._embed_depth == 0:
                self._in_embed = False
            return

        # Exiting last‑edit block?
        if tag == 'div' and self._in_lastedit:
            self._in_lastedit = False

def get_timestamps_from_page(url):
    resp = requests.get(url)
    resp.raise_for_status()
    parser = TimestampParser()
    parser.feed(resp.text)
    return parser.timestamps[1:] # Skip the first timestamp on each page (the thread-creation date in the page header, not a post)

if __name__ == '__main__':
    all_stamps = []
    current_page = 1
    failures = 0  # consecutive fetch failures for the current page
    while current_page <= pages:
        try:
            print(f"Scraping page {current_page} / {pages}...")
            stamps = get_timestamps_from_page(thread_url + "page-" + str(current_page))
            if stamps:
                all_stamps.extend(stamps)
            else:
                print("No valid timestamps found on that page.")
            current_page += 1
            failures = 0
        except requests.RequestException as e:
            # Retry the failed page, but give up after a few consecutive
            # failures instead of hammering the server forever.
            print(f"Error fetching page {current_page}: {e}")
            failures += 1
            if failures >= 3:
                print("Too many consecutive failures, skipping this page.")
                current_page += 1
                failures = 0
    #print(all_stamps)
    
    with open(filename, 'w', newline='') as csvfile:
        csv_writer = csv.writer(csvfile)
        csv_writer.writerows([[ts] for ts in all_stamps])
    print(f"Data saved to {filename}")
Python:
# KIWISPEED CHART MAKER
# Created by: my penis is on fire

import csv
from datetime import datetime, timedelta
import matplotlib.pyplot as plt
import matplotlib.dates as mdates
from collections import Counter, OrderedDict

## SETTINGS ##
csv_filename = "elonmusk.csv" # csv must be in same directory as this script
final_plot_title = "Elon Reeve Musk"
ppd_ylim = 0 # Adjust height of Posts Per Day line. Set to 0 to auto-set.
show_cumulative = False # Optional individual charts.
show_per_day = False
show_per_week = False
show_per_month = False



timestamps = []
with open(csv_filename, newline='') as f:
    reader = csv.reader(f)
    # The first row may be a header or a data row; keep it only if it parses as a timestamp.
    first_row = next(reader, None)
    if first_row:
        try:
            datetime.strptime(first_row[0], '%b %d %Y at %I:%M %p')
        except ValueError:
            pass  # not a timestamp, treat it as a header and skip it
        else:
            timestamps.append(first_row[0])
    for row in reader:
        if row:
            timestamps.append(row[0])

dt_list = [datetime.strptime(ts, '%b %d %Y at %I:%M %p') for ts in timestamps]
dt_list.sort()

times = dt_list
counts = list(range(1, len(times) + 1))

plt.style.use('dark_background')
if show_cumulative:
    fig, ax = plt.subplots()
    ax.step(times, counts, where='post', color = "#6BA65E")
    ax.set_title('Cumulative Posts Over Time')
    ax.set_xlabel('Time')
    ax.set_ylabel('Posts')
    ax.xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m-%d'))
    #plt.yscale('log')
    fig.autofmt_xdate()
    plt.tight_layout()


# Aggregate to weeks, months
def aggregate_counts(dt_list, freq):
    buckets = []
    for dt in dt_list:
        if freq == 'D':
            bucket = datetime(dt.year, dt.month, dt.day)
        elif freq == 'W':
            start = dt - timedelta(days=dt.weekday())  # Monday
            bucket = datetime(start.year, start.month, start.day)
        elif freq == 'M':
            bucket = datetime(dt.year, dt.month, 1)
        else:
            raise ValueError("freq must be one of 'D','W','M'")
        buckets.append(bucket)

    if not buckets:
        return OrderedDict()

    ctr = Counter(buckets)

    min_bucket = min(buckets)
    max_bucket = max(buckets)
    periods = []

    if freq == 'D':
        delta = timedelta(days=1)
        current = min_bucket
        while current <= max_bucket:
            periods.append(current)
            current += delta

    elif freq == 'W':
        delta = timedelta(weeks=1)
        current = min_bucket
        while current <= max_bucket:
            periods.append(current)
            current += delta

    elif freq == 'M':
        current = min_bucket
        while current <= max_bucket:
            periods.append(current)
            year = current.year + (current.month // 12)
            month = current.month % 12 + 1
            current = datetime(year, month, 1)

    ordered = OrderedDict((p, ctr.get(p, 0)) for p in periods)
    return ordered


daily = aggregate_counts(dt_list, 'D')
if show_per_day:
    fig, ax = plt.subplots()
    ax.plot(list(daily.keys()), list(daily.values()), marker='', color = "#6BA65E")
    ax.set_title('Posts per Day')
    ax.set_xlabel('Date')
    ax.set_ylabel('Posts per Day')
    ax.xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m-%d'))
    fig.autofmt_xdate()
    plt.tight_layout()

weekly = aggregate_counts(dt_list, 'W')
if show_per_week:
    fig, ax = plt.subplots()
    ax.plot(list(weekly.keys()), list(weekly.values()), marker='', color = "#6BA65E")
    ax.set_title('Posts per Week')
    ax.set_xlabel('Week Starting')
    ax.set_ylabel('Posts per Week')
    ax.xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m-%d'))
    fig.autofmt_xdate()
    plt.tight_layout()

monthly = aggregate_counts(dt_list, 'M')
if show_per_month:
    fig, ax = plt.subplots()
    ax.plot(list(monthly.keys()), list(monthly.values()), marker='', color = "#6BA65E")
    ax.set_title('Posts per Month')
    ax.set_xlabel('Month')
    ax.set_ylabel('Count')
    ax.xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m'))
    fig.autofmt_xdate()
    plt.tight_layout()

fig, ax1 = plt.subplots(figsize=(8,4))
ax2 = ax1.twinx()

ax1.set_zorder(ax2.get_zorder() + 1)
ax1.patch.set_visible(False)

ax2.plot(
    list(daily.keys()), list(daily.values()), label='Posts per Day', color="#E54C4C", zorder=1)
ax2.set_ylabel('Posts per Day')
ax2.tick_params(axis='y')
if ppd_ylim != 0: ax2.set_ylim(0, ppd_ylim)
#ax2.set_yscale('log')

ax1.step(times, counts, where='post', label='Total Posts', color="#6BA65E", zorder=2)
ax1.set_xlabel('Date')
ax1.set_ylabel('Total Posts')
ax1.xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m-%d'))
ax1.tick_params(axis='y')
#ax1.set_yscale('log')

lines1, labels1 = ax1.get_legend_handles_labels()
lines2, labels2 = ax2.get_legend_handles_labels()
ax1.legend(lines1 + lines2, labels1 + labels2, loc='upper left')

fig.autofmt_xdate()
plt.title(final_plot_title) 
plt.tight_layout()
plt.show()

HOW TO USE
1. Open your IDE of choice and paste the two code blocks above into their own scripts. (Unfortunately for you CLIheads out there, these don't take command-line arguments; you set everything in the ## SETTINGS ## block at the top of each script.)
2. Go to the thread you want to chart, paste the link of its first page into thread_url, enter the number of pages it has into pages, and set the output file name with filename.
KStut1.webp
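For example, the settings used for the Elon Musk chart above look like this:
Python:
## SETTINGS ##
thread_url = "https://kiwifarms.st/threads/elon-reeve-musk.134949/" # URL of page 1, keep the trailing slash
pages = 694 # Number of pages the thread has
filename = "elonmusk.csv" # Output file name, must end in .csv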
3. Run the code. You should start seeing this in the print area:
KStut2.webp
It will tell you once it's finished and the CSV has been generated. The CSV will appear in the same directory as the script.
KStut3.webp
KStut4.webp
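Each row of the CSV is one post timestamp in the format the chart script parses ('%b %d %Y at %I:%M %p'), one per line; a couple of made-up rows for illustration:

Oct 19 2024 at 5:23 PM
Oct 19 2024 at 5:41 PM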
4. Open KiwiSpeedChart.py. Set csv_filename to the name of the CSV you just generated, and set final_plot_title to whatever you want the chart title to be. ppd_ylim lets you cap the y-axis of the Posts per Day line; setting it higher makes the line look shorter. Leave it at 0 and PyPlot will auto-set the height. I made this a setting so you can keep the PPD line from overlapping the Total Posts line too much.
For show_cumulative, show_per_day, show_per_week, and show_per_month, setting any of those to True will generate an extra line chart showing cumulative total posts or posts per day, week, or month; see the example settings after the screenshot.
KStut5.webp
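For example (the ppd_ylim value here is just an illustrative guess; pick whatever suits your thread):
Python:
## SETTINGS ##
csv_filename = "elonmusk.csv"
final_plot_title = "Elon Reeve Musk"
ppd_ylim = 600        # example cap; keeps the red PPD line below the green Total Posts line
show_cumulative = False
show_per_day = False
show_per_week = False
show_per_month = True # also opens a standalone Posts per Month chart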
5. Run the code, and the chart(s) will appear in a new window. Use the Save icon to save it as a PNG.
KStut6.webp
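If you'd rather skip the save dialog, here's a minimal sketch of writing the PNG from code instead (the filename and dpi are just examples); drop it in right before plt.show():
Python:
fig.savefig("kiwispeed_chart.png", dpi=150, bbox_inches='tight') # saves next to the script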

Try it out! See how fast your favorite cow's thread moves!
 
By the way, if you go to /page=100000 or some other large number, it just sends you to the final page, meaning you can use that to work out the total page count rather than having to hard-code it.

Here's a quick update that does just that:

Python:
import requests
from html.parser import HTMLParser
from datetime import datetime
import csv
import re

## SETTINGS ##
thread_url = "https://kiwifarms.st/threads/xmr-monero.36856/"  # Base URL of thread
filename = "out.csv"  # Output file

class TimestampParser(HTMLParser):
    def __init__(self):
        super().__init__()
        self.timestamps = []
        self._in_lastedit = False
        self._in_embed = False
        self._embed_depth = 0

    def handle_starttag(self, tag, attrs):
        tag = tag.lower()
        attr_dict = {name.lower(): val for name, val in attrs}

        if tag == 'div' and 'class' in attr_dict and 'message-lastEdit' in attr_dict['class']:
            self._in_lastedit = True
            return
        if tag == 'div' and 'class' in attr_dict and 'fauxBlockLink' in attr_dict['class']:
            self._in_embed = True
            self._embed_depth = 1
            return
        if self._in_embed and tag == 'div':
            self._embed_depth += 1
            return
        if tag == 'time' and not self._in_lastedit and not self._in_embed:
            ts = None
            if 'title' in attr_dict:
                ts = attr_dict['title'].replace(',', '')
            elif 'datetime' in attr_dict:
                iso = attr_dict['datetime']
                try:
                    dt = datetime.fromisoformat(iso)
                    ts = dt.strftime('%b %d %Y at %I:%M %p').replace(' 0', ' ')
                except ValueError:
                    ts = iso
            if ts:
                self.timestamps.append(ts)

    def handle_endtag(self, tag):
        tag = tag.lower()
        if tag == 'div' and self._in_embed:
            self._embed_depth -= 1
            if self._embed_depth == 0:
                self._in_embed = False
        if tag == 'div' and self._in_lastedit:
            self._in_lastedit = False

def get_timestamps_from_page(url):
    resp = requests.get(url)
    resp.raise_for_status()
    parser = TimestampParser()
    parser.feed(resp.text)
    return parser.timestamps[1:]

def get_actual_last_page(base_url):
    test_url = base_url + "?page=1000000"
    resp = requests.get(test_url, allow_redirects=True)
    resp.raise_for_status()
    # Look for: <li class="pageNav-page pageNav-page--current "><a href="...">694</a></li>
    match = re.search(r'<li class="pageNav-page pageNav-page--current[^"]*">\s*<a[^>]*>(\d+)</a>', resp.text)
    if match:
        return int(match.group(1))
    raise RuntimeError("Failed to determine last page number.")

if __name__ == '__main__':
    print("Determining total number of pages...")
    pages = get_actual_last_page(thread_url)
    print(f"Total pages: {pages}")

    all_stamps = []
    for current_page in range(1, pages + 1):
        try:
            print(f"Scraping page {current_page} / {pages}...")
            stamps = get_timestamps_from_page(f"{thread_url}?page={current_page}")
            if stamps:
                all_stamps.extend(stamps)
            else:
                print("No valid timestamps found on that page.")
        except requests.RequestException as e:
            print(f"Error fetching page {current_page}: {e}")

    with open(filename, 'w', newline='') as csvfile:
        csv_writer = csv.writer(csvfile)
        csv_writer.writerows([[ts] for ts in all_stamps])
    print(f"Data saved to {filename}")

FYI I got banned before for scraping and making charts of reactions, I'm sure our dear feeder is less autistic about post times but still, scrape shit at your own risk :)
 
A fun script with a side of DDoS if it gets popular, sweet! Honestly, I wish this was something the forum tools provided in the first place; it's a cool idea, and it shouldn't take multiple thousands of page loads to keep track of.
 
is this pinging the kf servers? will this be equal to a ddos?
a DDoS would be a malicious attack and I would be very surprised if the servers couldn't handle a few autists scraping pages, but yes enough people doing it could hurt the servers. Loading every page in a thread sequentially is theoretically something that a human would do, so if you add a longer delay in between requests and just let it run overnight or something it should be fine.
Unless Josh ever releases a database or API, scraping is the only way that victims of autism like OP and me can get our fix.
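A minimal sketch of the slow-and-polite loop, reusing the OP's get_timestamps_from_page helper and settings (the 10-second delay is arbitrary):
Python:
import time

all_stamps = []
for current_page in range(1, pages + 1):
    all_stamps.extend(get_timestamps_from_page(f"{thread_url}page-{current_page}"))
    time.sleep(10)  # several seconds between requests: slow, but easy on the server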
 
is this pinging the kf servers? will this be equal to a ddos?
a DDoS would be a malicious attack
Unintentional DDoS is still a DDoS. Malice is not required, and servers don't care about good intentions while they churn and die.

Loading every page in a thread sequentially is theoretically something that a human would do, so if you add a longer delay in between requests and just let it run overnight or something it should be fine.
Maybe I'm blind, but I don't see any delay built in. Why not throw a

time.sleep(5)

in there between page requests? This isn't time-critical or constantly changing data, the default should be a benign scrape overnight or something.
 
I'd say don't. At least not until there's a version with rate-limiting. That's well over 10,000 pages at this point.
Unintentional DDoS is still a DDoS. Malice is not required, and servers don't care about good intentions while they churn and die.


Maybe I'm blind, but I don't see any delay built in. Why not throw a

time.sleep(5)

in there between page requests? This isn't time-critical or constantly changing data, the default should be a benign scrape overnight or something.
Python:
import requests
from html.parser import HTMLParser
from datetime import datetime
import csv
import re
import argparse
import sys
import time

class TimestampParser(HTMLParser):
    def __init__(self):
        super().__init__()
        self.timestamps = []
        self._in_lastedit = False
        self._in_embed = False
        self._embed_depth = 0

    def handle_starttag(self, tag, attrs):
        tag = tag.lower()
        attr_dict = {name.lower(): val for name, val in attrs}

        if tag == 'div' and 'class' in attr_dict and 'message-lastEdit' in attr_dict['class']:
            self._in_lastedit = True
            return
        if tag == 'div' and 'class' in attr_dict and 'fauxBlockLink' in attr_dict['class']:
            self._in_embed = True
            self._embed_depth = 1
            return
        if self._in_embed and tag == 'div':
            self._embed_depth += 1
            return
        if tag == 'time' and not self._in_lastedit and not self._in_embed:
            ts = None
            if 'title' in attr_dict:
                ts = attr_dict['title'].replace(',', '')
            elif 'datetime' in attr_dict:
                iso = attr_dict['datetime']
                try:
                    dt = datetime.fromisoformat(iso)
                    ts = dt.strftime('%b %d %Y at %I:%M %p').replace(' 0', ' ')
                except ValueError:
                    ts = iso
            if ts:
                self.timestamps.append(ts)

    def handle_endtag(self, tag):
        tag = tag.lower()
        if tag == 'div' and self._in_embed:
            self._embed_depth -= 1
            if self._embed_depth == 0:
                self._in_embed = False
        if tag == 'div' and self._in_lastedit:
            self._in_lastedit = False

def get_timestamps_from_page(url):
    resp = requests.get(url)
    resp.raise_for_status()
    parser = TimestampParser()
    parser.feed(resp.text)
    return parser.timestamps[1:]

def get_actual_last_page(base_url):
    test_url = base_url + "?page=1000000"
    resp = requests.get(test_url, allow_redirects=True)
    resp.raise_for_status()
    match = re.search(r'<li class="pageNav-page pageNav-page--current[^"]*">\s*<a[^>]*>(\d+)</a>', resp.text)
    if match:
        return int(match.group(1))
    raise RuntimeError("Failed to determine last page number.")

def main():
    parser = argparse.ArgumentParser(description="scrape post timestamps")
    parser.add_argument("url", help="URL (https://kiwifarms.st/threads/thread-title.12345/)")
    parser.add_argument("-o", "--output", default="output.csv", help="output filename")
    parser.add_argument("-d", "--delay", type=int, default=0, help="delay between requests in milliseconds")
    args = parser.parse_args()

    thread_url = args.url.rstrip('/')
    filename = args.output
    delay_sec = args.delay / 1000.0

    print("Determining total number of pages...")
    try:
        pages = get_actual_last_page(thread_url)
    except Exception as e:
        print(f"Failed to determine last page: {e}")
        sys.exit(1)

    print(f"Total pages: {pages}")

    all_stamps = []
    for current_page in range(1, pages + 1):
        try:
            print(f"Scraping page {current_page} / {pages}...")
            page_url = f"{thread_url}?page={current_page}"
            stamps = get_timestamps_from_page(page_url)
            if stamps:
                all_stamps.extend(stamps)
            else:
                print("No valid timestamps found on that page.")
            if delay_sec > 0:
                time.sleep(delay_sec)
        except requests.RequestException as e:
            print(f"Error fetching page {current_page}: {e}")

    with open(filename, 'w', newline='') as csvfile:
        csv_writer = csv.writer(csvfile)
        csv_writer.writerows([[ts] for ts in all_stamps])

    print(f"Data saved to {filename}")

if __name__ == '__main__':
    main()


Updated version of OP's script: instead of hard-coding the URL and output, you pass CLI arguments, and you can add a custom delay. Example:

python .\scraper.py https://kiwifarms.st/threads/xmr-monero.36856/ -o xmr.csv -d 5000

This would scrape the XMR/Monero thread timestamps with a 5000 millisecond (5 second) delay between requests, and write the output to xmr.csv
 
In my defense, it doesn't request a page until it's done parsing the last one, so on my machine it sends a request about every half second. Yeah, it's not true and honest rate limiting, but at least it isn't just spam-pinging the server.
Anyway,
USPG2.webp
Not doing any more tonight to make sure Null doesn't come to my house and kill me with a hammer
 
Here's the one for BossmanJack. It's funny to see the post speed increase and decrease based on when he's in and out of jail/rehab.
Also, I didn't realize the script was hitting the site as hard as it was; sorry for unintentionally DDoSing the site for a bit :stress:
BossmanChart.webp
BossmanPostsPerDay.webp
BossmanPostsPerWeek.webp
BossmanPostsPerMonth.webp
BossmanPostsOverTime.webp
 