#!/bin/bash -l

# Scrape a reference table of HTML attributes and print it as
# tab-separated rows on stdout.
#
# External commands used: http_get, xmllint, perl, sed, awk, grep,
# xml2csv, html2csv. http_get, xml2csv and html2csv are not defined in this
# file; NOTE(review): presumably they are provided by the login environment
# (the shebang starts bash with -l) -- confirm.

# NB 01.06.23: TODEL
# Disabled html.com scraper: `&&` binds looser than `|`, so the leading
# `false` short-circuits the whole pipeline and none of it runs.
false && http_get https://html.com/attributes/ \
| sed -E "s,<(thrive_headline|header)[^.>]+>([^<]+)</\1>,<div>\2</div>," \
| xmllint --html --xpath //table - 2>/dev/null \
| sed -E "s,<a[^>]+href=\"((https://html.com)?/attributes/([^\"\/]+)\/?)[^<]+</a>,\3</td><td>https://html.com/\1,g" \
| xml2csv - \
| awk 'BEGIN{FS="\t"}{print $1"\t"$3"\t"$2}'

# Active w3schools scraper (the leading `true &&` is the on/off toggle):
#   1. xmllint - extract the table(s) under <div id="main">; parser noise on
#                stderr is discarded on purpose.
#   2. grep -v - drop lines containing href="tag_.
#   3. perl    - turn a cell holding a link into two cells: the absolute
#                w3schools URL, then the link text.
#   4. html2csv - convert the table markup to delimited text
#                (NOTE(review): assumed tab-separated, since awk splits on
#                tabs -- confirm).
#   5. sed     - double the first backslash on each line.
#   6. awk     - keep only rows mentioning www.w3schools.com and print
#                fields 2, 3, 1 separated by tabs.
true && http_get https://www.w3schools.com/tags/ref_attributes.asp | \
xmllint --html --xpath '/html/body//div[@id="main"]//table' - 2>/dev/null | \
grep -v 'href="tag_' | \
perl -pe 's|<td[^>]*><a href="([^"]+)">([^<]+)</a></td>|<td>https://www.w3schools.com/tags/$1</td><td>$2</td>|' | \
html2csv | \
sed -E "s,(\\\\),\1\1," | \
awk 'BEGIN{FS="\t"} /www\.w3schools\.com/ {print $2"\t"$3"\t"$1}'