From d12aa3d042f90260ba0652ddaf2f488a50a83816 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 6 Dec 2018 11:27:03 -0600 Subject: [PATCH 001/245] Reorg profile-data.sql.js --- dbs/schemas/profile-data.sql.js | 83 +++++++++++++++++---------------- 1 file changed, 43 insertions(+), 40 deletions(-) diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 39b9090a..2c94e90c 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -46,18 +46,6 @@ CREATE TABLE archives_meta_type ( type TEXT ); --- a list of the draft-dats for a master-dat -CREATE TABLE archive_drafts ( - profileId INTEGER, - masterKey TEXT, -- key of the master dat - draftKey TEXT, -- key of the draft dat - createdAt INTEGER DEFAULT (strftime('%s', 'now')), - - isActive INTEGER, -- is this the active draft? (deprecated) - - FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE -); - CREATE TABLE bookmarks ( profileId INTEGER, url TEXT NOT NULL, @@ -72,17 +60,6 @@ CREATE TABLE bookmarks ( FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE ); -CREATE TABLE templates ( - profileId INTEGER, - url TEXT NOT NULL, - title TEXT, - screenshot, - createdAt INTEGER DEFAULT (strftime('%s', 'now')), - - PRIMARY KEY (profileId, url), - FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE -); - CREATE TABLE visits ( profileId INTEGER, url TEXT NOT NULL, @@ -102,8 +79,48 @@ CREATE TABLE visit_stats ( CREATE VIRTUAL TABLE visit_fts USING fts4 (url, title); CREATE UNIQUE INDEX visits_stats_url ON visit_stats (url); --- list of the user's installed apps +-- list of dats being looked for +CREATE TABLE watchlist ( + profileId INTEGER NOT NULL, + url TEXT NOT NULL, + description TEXT NOT NULL, + seedWhenResolved BOOLEAN NOT NULL, + resolved BOOLEAN NOT NULL DEFAULT (0), + updatedAt INTEGER DEFAULT (strftime('%s', 'now')), + createdAt INTEGER DEFAULT (strftime('%s', 'now')), + + PRIMARY KEY (profileId, url), + FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE +); + +-- list of the users current templates +-- deprecated (may return) +CREATE TABLE templates ( + profileId INTEGER, + url TEXT NOT NULL, + title TEXT, + screenshot, + createdAt INTEGER DEFAULT (strftime('%s', 'now')), + + PRIMARY KEY (profileId, url), + FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE +); + +-- a list of the draft-dats for a master-dat -- deprecated +CREATE TABLE archive_drafts ( + profileId INTEGER, + masterKey TEXT, -- key of the master dat + draftKey TEXT, -- key of the draft dat + createdAt INTEGER DEFAULT (strftime('%s', 'now')), + + isActive INTEGER, -- is this the active draft? 
(deprecated) + + FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE +); + +-- list of the users installed apps +-- deprecated (may return) CREATE TABLE apps ( profileId INTEGER NOT NULL, name TEXT NOT NULL, @@ -115,8 +132,8 @@ CREATE TABLE apps ( FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE ); --- log of the user's app installations --- deprecated +-- log of the users app installations +-- deprecated (may return) CREATE TABLE apps_log ( profileId INTEGER NOT NULL, name TEXT NOT NULL, @@ -126,20 +143,6 @@ CREATE TABLE apps_log ( FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE ); --- add a database for watchlist feature -CREATE TABLE watchlist ( - profileId INTEGER NOT NULL, - url TEXT NOT NULL, - description TEXT NOT NULL, - seedWhenResolved BOOLEAN NOT NULL, - resolved BOOLEAN NOT NULL DEFAULT (0), - updatedAt INTEGER DEFAULT (strftime('%s', 'now')), - createdAt INTEGER DEFAULT (strftime('%s', 'now')), - - PRIMARY KEY (profileId, url), - FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE -); - -- deprecated CREATE TABLE workspaces ( profileId INTEGER NOT NULL, From 0a4e01f6fcb988f029831a4f70ec0b440b43174f Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 6 Dec 2018 14:44:42 -0600 Subject: [PATCH 002/245] Add the beaker.posts and beaker.followgraph API skeletons --- crawler/followgraph.js | 16 ++++++++++++++++ crawler/posts.js | 20 ++++++++++++++++++++ web-apis/bg.js | 6 ++++++ web-apis/fg/beaker.js | 17 +++++++++++++++++ web-apis/manifests/internal/followgraph.js | 6 ++++++ web-apis/manifests/internal/posts.js | 7 +++++++ 6 files changed, 72 insertions(+) create mode 100644 crawler/followgraph.js create mode 100644 crawler/posts.js create mode 100644 web-apis/manifests/internal/followgraph.js create mode 100644 web-apis/manifests/internal/posts.js diff --git a/crawler/followgraph.js b/crawler/followgraph.js new file mode 100644 index 00000000..172d75ea --- /dev/null +++ b/crawler/followgraph.js @@ -0,0 +1,16 @@ + +exports.queryAll = function () { + throw new Error('Not yet implemented') +} + +exports.query = function () { + throw new Error('Not yet implemented') +} + +exports.follow = function () { + throw new Error('Not yet implemented') +} + +exports.unfollow = function () { + throw new Error('Not yet implemented') +} diff --git a/crawler/posts.js b/crawler/posts.js new file mode 100644 index 00000000..58341be9 --- /dev/null +++ b/crawler/posts.js @@ -0,0 +1,20 @@ + +exports.list = async function () { + throw new Error('Not yet implemented') +} + +exports.get = async function () { + throw new Error('Not yet implemented') +} + +exports.create = async function () { + throw new Error('Not yet implemented') +} + +exports.edit = async function () { + throw new Error('Not yet implemented') +} + +exports.delete = async function () { + throw new Error('Not yet implemented') +} \ No newline at end of file diff --git a/web-apis/bg.js b/web-apis/bg.js index 7b431c04..6702b4cb 100644 --- a/web-apis/bg.js +++ b/web-apis/bg.js @@ -10,6 +10,8 @@ const downloadsManifest = require('./manifests/internal/downloads') const historyManifest = require('./manifests/internal/history') const sitedataManifest = require('./manifests/internal/sitedata') const watchlistManifest = require('./manifests/internal/watchlist') +const postsManifest = require('./manifests/internal/posts') +const followgraphManifest = require('./manifests/internal/followgraph') // internal apis const archivesAPI = require('./bg/archives') @@ -17,6 +19,8 @@ const 
bookmarksAPI = require('./bg/bookmarks') const historyAPI = require('./bg/history') const sitedataAPI = require('../dbs/sitedata').WEBAPI const watchlistAPI = require('./bg/watchlist') +const postsAPI = require('../crawler/posts') +const followgraphAPI = require('../crawler/followgraph') // external manifests const datArchiveManifest = require('./manifests/external/dat-archive') @@ -50,6 +54,8 @@ exports.setup = function () { globals.rpcAPI.exportAPI('history', historyManifest, historyAPI, internalOnly) globals.rpcAPI.exportAPI('sitedata', sitedataManifest, sitedataAPI, internalOnly) globals.rpcAPI.exportAPI('watchlist', watchlistManifest, watchlistAPI, internalOnly) + globals.rpcAPI.exportAPI('posts', postsManifest, postsAPI, internalOnly) + globals.rpcAPI.exportAPI('followgraph', followgraphManifest, followgraphAPI, internalOnly) // external apis globals.rpcAPI.exportAPI('dat-archive', datArchiveManifest, datArchiveAPI, secureOnly) diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 0d463cee..f356c463 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -8,6 +8,8 @@ const downloadsManifest = require('../manifests/internal/downloads') const historyManifest = require('../manifests/internal/history') const sitedataManifest = require('../manifests/internal/sitedata') const watchlistManifest = require('../manifests/internal/watchlist') +const postsManifest = require('../manifests/internal/posts') +const followgraphManifest = require('../manifests/internal/followgraph') exports.setup = function (rpc) { const beaker = {} @@ -22,6 +24,8 @@ exports.setup = function (rpc) { const historyRPC = rpc.importAPI('history', historyManifest, opts) const sitedataRPC = rpc.importAPI('sitedata', sitedataManifest, opts) const watchlistRPC = rpc.importAPI('watchlist', watchlistManifest, opts) + const postsRPC = rpc.importAPI('posts', postsManifest, opts) + const followgraphRPC = rpc.importAPI('followgraph', followgraphManifest, opts) // beaker.archives beaker.archives = new EventTarget() @@ -148,6 +152,19 @@ exports.setup = function (rpc) { beaker.watchlist.update = watchlistRPC.update beaker.watchlist.remove = watchlistRPC.remove beaker.watchlist.createEventsStream = () => fromEventStream(watchlistRPC.createEventsStream()) + + // beaker.posts + beaker.posts.list = postsRPC.list + beaker.posts.get = postsRPC.get + beaker.posts.create = postsRPC.create + beaker.posts.edit = postsRPC.edit + beaker.posts.delete = postsRPC.delete + + // beaker.followgraph + beaker.followgraph.queryall = followgraphRPC.queryall + beaker.followgraph.query = followgraphRPC.query + beaker.followgraph.follow = followgraphRPC.follow + beaker.followgraph.unfollow = followgraphRPC.unfollow } return beaker diff --git a/web-apis/manifests/internal/followgraph.js b/web-apis/manifests/internal/followgraph.js new file mode 100644 index 00000000..8c8549c8 --- /dev/null +++ b/web-apis/manifests/internal/followgraph.js @@ -0,0 +1,6 @@ +module.exports = { + queryAll: 'promise', + query: 'promise', + follow: 'promise', + unfollow: 'promise' +} \ No newline at end of file diff --git a/web-apis/manifests/internal/posts.js b/web-apis/manifests/internal/posts.js new file mode 100644 index 00000000..b4e21d9b --- /dev/null +++ b/web-apis/manifests/internal/posts.js @@ -0,0 +1,7 @@ +module.exports = { + list: 'promise', + get: 'promise', + create: 'promise', + edit: 'promise', + delete: 'promise' +} \ No newline at end of file From 428568f6a357d49e190307fdbbfaf4249cd755c5 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 6 
Dec 2018 19:25:08 -0600 Subject: [PATCH 003/245] Implement the majority of the crawler (WIP) --- crawler/followgraph.js | 87 ++++++++++++++- crawler/index.js | 63 +++++++++++ crawler/posts.js | 107 ++++++++++++++++++- crawler/util.js | 45 ++++++++ dat/library.js | 5 +- dbs/schemas/profile-data.sql.js | 51 +++++++++ index.js | 13 ++- users/index.js | 180 ++++++++++++++++++++++++++++++++ 8 files changed, 533 insertions(+), 18 deletions(-) create mode 100644 crawler/index.js create mode 100644 crawler/util.js create mode 100644 users/index.js diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 172d75ea..6ccfab45 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -1,16 +1,95 @@ +const Events = require('events') +const db = require('../dbs/profile-data-db') +const {doCrawl} = require('./util') -exports.queryAll = function () { - throw new Error('Not yet implemented') +// constants +// = + +const TABLE_VERSION = 1 + +// globals +// = + +var events = new Events() + +// exported api +// = + +exports.on = events.on.bind(events) +exports.addListener = events.addListener.bind(events) +exports.removeListener = events.removeListener.bind(events) + +exports.crawlSite = async function (archive) { + return doCrawl(archive, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { + if (resetRequired) { + // reset all data + // TODO + } + + // find files that need to be processed + // TODO + + // process the files + // TODO + // events.emit('follow-added', sourceUrl, subjectUrl) + // events.emit('follow-removed', sourceUrl, subjectUrl) + }) } -exports.query = function () { - throw new Error('Not yet implemented') +// List urls of sites that follow subject +// - subject. String (URL). +// - returns Array +exports.listFollowers = async function (subject) { + var rows = await db.all(` + SELECT crawl_sources.url + FROM crawl_sources + INNER JOIN crawl_followgraph + ON crawl_followgraph.crawlSourceId = crawl_sources.id + AND crawl_followgraph.destUrl = ? + `, [subject]) + return rows.map(row => row.url) +} + +// List urls of sites that subject follows +// - subject. String (URL). +// - returns Array +exports.listFollows = async function (subject) { + var rows = await db.all(` + SELECT crawl_followgraph.destUrl + FROM crawl_followgraph + INNER JOIN crawl_sources + ON crawl_followgraph.crawlSourceId = crawl_sources.id + AND crawl_sources.url = ? + `, [subject]) + return rows.map(row => row.destUrl) +} + +// Check for the existence of an individual follow +// - a. String (URL), the site being queried. +// - b. String (URL), does a follow this site? +// - returns bool +exports.isAFollowingB = async function (a, b) { + var res = await db.get(` + SELECT crawl_sources.id + FROM crawl_sources + INNER JOIN crawl_followgraph + ON crawl_followgraph.crawlSourceId = crawl_sources.id + AND crawl_followgraph.destUrl = ? + WHERE crawl_sources.url = ? 
+ `, [b, a]) + return !!res } exports.follow = function () { throw new Error('Not yet implemented') + + // update the user dat + // TODO } exports.unfollow = function () { throw new Error('Not yet implemented') + + // update the user dat + // TODO } diff --git a/crawler/index.js b/crawler/index.js new file mode 100644 index 00000000..f87825f3 --- /dev/null +++ b/crawler/index.js @@ -0,0 +1,63 @@ +const _throttle = require('lodash.throttle') +const lock = require('../lib/lock') +const users = require('../users') +const dat = require('../dat') + +const posts = require('./posts') +const followgraph = require('./followgraph') + +// globals +// = + +const watches = {} + +// exported api +// = + +exports.posts = posts +exports.followgraph = followgraph + +exports.setup = async function () { +} + +exports.watchSite = async function (archive) { + if (typeof archive === 'string') { + archive = await dat.library.getOrLoadArchive() + } + + if (!(archive.url in watches)) { + const queueCrawl = _throttle(() => crawlSite(archive), 5e3) + + // watch for file changes + watches[archive.url] = archive.pda.watch() + watches[archive.url].on('data', ([event, args]) => { + if (event === 'invalidated') { + queueCrawl() + } + }) + + // run the first crawl + crawlSite(archive) + } +} + +exports.unwatchSite = async function (url) { + // stop watching for file changes + if (url in watches) { + watches[url].close() + watches[url] = null + } +} + +async function crawlSite (archive) { + var release = await lock('crawl:' + archive.url) + try { + await Promise.all([ + posts.crawlSite(archive), + followgraph.crawlSite(archive) + ]) + } finally { + release() + } +} +exports.crawlSite = crawlSite \ No newline at end of file diff --git a/crawler/posts.js b/crawler/posts.js index 58341be9..07479d75 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -1,20 +1,117 @@ +const assert = require('assert') +const {URL} = require('url') +const Events = require('events') +const db = require('../dbs/profile-data-db') +const {doCrawl} = require('./util') -exports.list = async function () { - throw new Error('Not yet implemented') +// constants +// = + +const TABLE_VERSION = 1 + +// globals +// = + +var events = new Events() + +// exported api +// = + +exports.on = events.on.bind(events) +exports.addListener = events.addListener.bind(events) +exports.removeListener = events.removeListener.bind(events) + +exports.crawlSite = async function (archive) { + return doCrawl(archive, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { + if (resetRequired) { + // reset all data + // TODO + } + + // find files that need to be processed + // TODO + + // process the files + // TODO + // events.emit('post-added', sourceUrl) + // events.emit('post-updated', sourceUrl) + // events.emit('post-removed', sourceUrl) + }) } -exports.get = async function () { - throw new Error('Not yet implemented') +exports.list = async function ({offset, limit, reverse, author} = {}) { + // validate & parse params + assert(!offset || typeof offset === 'number', 'Offset must be a number') + assert(!limit || typeof limit === 'number', 'Limit must be a number') + assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') + assert(!author || typeof author === 'string', 'Author must be a string') + if (author) { + try { author = new URL(author) } + catch (e) { throw new Error('Failed to parse author URL: ' + author) } + } + + // build query + var query = `SELECT crawl_posts.*, src.url AS crawlSourceUrl FROM crawl_posts` + var values = [] + 
if (author) { + query += ` INNER JOIN crawl_sources src ON src.url = ?` + values.push(author.origin) + } + if (offset) { + query += ` OFFSET ?` + values.push(offset) + } + if (limit) { + query += ` LIMIT ?` + values.push(limit) + } + query += ` ORDER BY createdAt` + if (reverse) { + query += ` DESC` + } + + // execute query + return db.all(query, values) +} + +exports.get = async function (url, pathname = undefined) { + // validate & parse params + if (url) { + try { url = new URL(url) } + catch (e) { throw new Error('Failed to parse post URL: ' + url) } + } + pathname = pathname || url.pathname + + // execute query + return db.get(` + SELECT + crawl_posts.*, src.url AS crawlSourceUrl + FROM crawl_posts + INNER JOIN crawl_sources src + ON src.id = crawl_posts.crawlSourceId + AND src.url = ? + WHERE + crawl_posts.pathname = ? + `, [url.origin, pathname]) } exports.create = async function () { throw new Error('Not yet implemented') + + // update the user dat + // TODO } exports.edit = async function () { throw new Error('Not yet implemented') + + // update the user dat + // TODO } exports.delete = async function () { throw new Error('Not yet implemented') -} \ No newline at end of file + + // update the user dat + // TODO +} diff --git a/crawler/util.js b/crawler/util.js new file mode 100644 index 00000000..303f25c0 --- /dev/null +++ b/crawler/util.js @@ -0,0 +1,45 @@ +const db = require('../dbs/profile-data-db') + +exports.doCrawl = async function (archive, crawlDataset, crawlDatasetVersion, handlerFn) { + const url = archive.url + + // fetch current crawl state + var resetRequired = false + var state = await db.get(` + SELECT crawl_sources_meta.* FROM crawl_sources_meta + INNER JOIN crawl_sources ON crawl_sources.url = ? + WHERE crawl_sources_meta.crawlDataset = ? 
+ `, [url, crawlDataset]) + if (state.crawlDatasetVersion !== crawlDatasetVersion) { + resetRequired = true + state = null + } + if (!state) { + // new state + state = { + crawlSourceId: null, + url, + crawlDataset, + crawlDatasetVersion, + updatedAt: 0 + } + } + + // fetch current archive version + // TODO + + // fetch change log + var changes = [] // TODO + + // handle changes + await handlerFn({changes, resetRequired}) + + if (!state.crawlSourceId) { + // upsert crawl source + // TODO + } + + // upsert crawl state + state.updatedAt = Date.now() + // TODO +} \ No newline at end of file diff --git a/dat/library.js b/dat/library.js index e17dfb38..1cb63df5 100644 --- a/dat/library.js +++ b/dat/library.js @@ -5,7 +5,7 @@ const pify = require('pify') const pda = require('pauls-dat-api') const signatures = require('sodium-signatures') const parseDatURL = require('parse-dat-url') -const debounce = require('lodash.debounce') +const _debounce = require('lodash.debounce') const mkdirp = require('mkdirp') // dbs @@ -312,7 +312,7 @@ async function loadArchiveInner (key, secretKey, userSettings = null) { await pullLatestArchiveMeta(archive) // wire up events - archive.pullLatestArchiveMeta = debounce(opts => pullLatestArchiveMeta(archive, opts), 1e3) + archive.pullLatestArchiveMeta = _debounce(opts => pullLatestArchiveMeta(archive, opts), 1e3) archive.fileActStream = archive.pda.watch() archive.fileActStream.on('data', ([event, {path}]) => { if (event === 'changed') { @@ -535,6 +535,7 @@ function createArchiveProxy (key, version, archiveInfo) { const pdaStat = makeArchiveProxyPDAPromiseFn(key, version, 'stat') return { key: datEncoding.toBuf(key), + url: `dat://${key}`, discoveryKey: datEncoding.toBuf(archiveInfo.discoveryKey), writable: archiveInfo.writable, diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 2c94e90c..46cbd6a7 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -5,6 +5,13 @@ CREATE TABLE profiles ( createdAt INTEGER DEFAULT (strftime('%s', 'now')) ); +CREATE TABLE users ( + id INTEGER PRIMARY KEY NOT NULL, + url TEXT, + isDefault INTEGER DEFAULT 0, + createdAt INTEGER +); + CREATE TABLE archives ( profileId INTEGER NOT NULL, key TEXT NOT NULL, -- dat key @@ -93,6 +100,50 @@ CREATE TABLE watchlist ( FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE ); +-- list of sites being crawled +CREATE TABLE crawl_sources ( + id INTEGER PRIMARY KEY NOT NULL, + url TEXT NOT NULL +); + +-- tracking information on the crawl-state of the sources +CREATE TABLE crawl_sources_meta ( + crawlSourceId INTEGER NOT NULL, + crawlSourceVersion INTEGER NOT NULL, + crawlDataset TEXT NOT NULL, + crawlDatasetVersion INTEGER NOT NULL, + updatedAt INTEGER DEFAULT, + + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + +-- crawled posts +CREATE TABLE crawl_posts ( + crawlSourceId INTEGER NOT NULL, + pathname TEXT NOT NULL, + + type TEXT NOT NULL, + content TEXT, + + createdAt INTEGER DEFAULT (strftime('%s', 'now')), + updatedAt INTEGER DEFAULT (strftime('%s', 'now')), + crawledAt INTEGER DEFAULT (strftime('%s', 'now')), + + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + +-- crawled follows +CREATE TABLE crawl_followgraph ( + crawlSourceId INTEGER NOT NULL, + + destUrl TEXT NOT NULL, + + updatedAt INTEGER DEFAULT (strftime('%s', 'now')), + crawledAt INTEGER DEFAULT (strftime('%s', 'now')), + + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE 
+); + -- list of the users current templates -- deprecated (may return) CREATE TABLE templates ( diff --git a/index.js b/index.js index decbfc1e..7f46ea90 100644 --- a/index.js +++ b/index.js @@ -5,6 +5,8 @@ const globals = require('./globals') const {getEnvVar} = require('./lib/env') const dat = require('./dat') const dbs = require('./dbs') +const users = require('./users') +const crawler = require('./crawler') const webapis = require('./web-apis/bg') const spellChecker = require('./web-apis/bg/spell-checker') const spellCheckerLib = require('./lib/spell-checker') @@ -45,16 +47,13 @@ module.exports = { } } - // setup dat + // start subsystems + // (order is important) await dat.library.setup(opts) - - // setup watchlist await dat.watchlist.setup() - - // setup web apis + await crawler.setup(opts) + await users.setup(opts) webapis.setup(opts) - - // setup spellchecker spellCheckerLib.setup() } } diff --git a/users/index.js b/users/index.js new file mode 100644 index 00000000..da8b72b4 --- /dev/null +++ b/users/index.js @@ -0,0 +1,180 @@ +const Events = require('events') +const dat = require('../dat') +const crawler = require('../crawler') +const db = require('../dbs/profile-data-db') +const archivesDb = require('../dbs/archives') +const debug = require('../lib/debug-logger').debugLogger('users') + +// globals +// = + +var events = new Events() +var users + +// exported api +// = + +exports.on = events.on.bind(events) +exports.addListener = events.addListener.bind(events) +exports.removeListener = events.removeListener.bind(events) + +exports.setup = async function () { + // wire up events + crawler.followgraph.on('follow-added', onFollowAdded) + crawler.followgraph.on('follow-removed', onFollowRemoved) + + // load the current users + users = await db.all(`SELECT * FROM users`) + users.forEach(async (user) => { + // massage data + user.archive = null + user.isDefault = Boolean(user.isDefault) + user.createdAt = new Date(user.createdAt) + + // fetch the user archive + try { + await validateUserUrl(user.url) + user.archive = await dat.library.getOrLoadArchive(user.url) + watchUser(user) + events.emit('load-user', user) + } catch (err) { + debug('Failed to load user', {user, err}) + } + }) +} + +exports.getAll = async function () { + return Promise.all(users.map(fetchUserInfo)) +} + +const get = +exports.get = async function (url) { + var user = users.find(user => user.url === url) + if (!user) return null + return await fetchUserInfo(user) +} + +const getDefault = +exports.getDefault = async function (url = undefined) { + var user = users.find(user => user.isDefault === true) + if (!user) return null + return await fetchUserInfo(user) +} + +exports.add = async function (url) { + // make sure the user doesnt already exist + var existingUser = await get(url) + if (existingUser) return + + // validate + await validateUserUrl(url) + + // create the new user + var user = { + url, + archive: null, + isDefault: users.length === 0, + createdAt: Date.now() + } + await db.run( + `INSERT INTO users (url, isDefault, createdAt) VALUES (?, ?, ?)`, + [user.url, Number(user.isDefault), user.createdAt] + ) + + // fetch the user archive + user.archive = await dat.library.getOrLoadArchive(user.url) + watchUser(user) + events.emit('load-user', user) +} + +exports.remove = async function (url) { + // get the user + var user = await get(url) + if (!user) return + + // remove the user + users.splice(users.indexOf(user), 1) + await db.run(`DELETE FROM users WHERE url = ?`, [user.url]) + unwatchUser(user) + 
events.emit('unload-user', user) +} + +// internal methods +// = + +async function isUser (url) { + return !!(await get(url)) +} + +async function watchUser (user) { + // watch the user + await crawler.watchSite(user.archive) + + // watch anybody the user follows + var followUrls = await crawler.followgraph.listFollows(user.url) + followUrls.forEach(async (followUrl) => { + try { + await crawler.watchSite(followUrl) + } catch (err) { + debug('Failed to sync followed user', {url: followUrl, err}) + } + }) +} + +async function unwatchUser (user) { + // unwatch anybody the user follows + + // BUG This will cause glitches if there are any shared follows between 2 local users (which is likely) + // sites will be unwatched when they shouldn't be + // this is temporary and will fix itself when beaker restarts + // -prf + + var followUrls = await crawler.followgraph.listFollows(user.url) + followUrls.forEach(crawler.unwatchSite) + + // unwatch the user + await crawler.unwatchSite(user.url) +} + +async function onFollowAdded (sourceUrl, subjectUrl) { + if (isUser(sourceUrl)) { + try { + await crawler.watchSite(subjectUrl) + } catch (err) { + debug('Failed to sync followed user', {url: subjectUrl, err}) + } + } +} + +async function onFollowRemoved (sourceUrl, subjectUrl) { + if (isUser(sourceUrl)) { + await crawler.unwatchSite(subjectUrl) + } +} + +async function fetchUserInfo (user) { + var urlp = new URL(user.url) + var meta = await archivesDb.getMeta(urlp.hostname) + return { + url: user.url, + isDefault: user.isDefault, + title: meta.title, + description: meta.description, + createdAt: user.createdAt + } +} + +async function validateUserUrl (url) { + // make sure the archive is saved and that we own the archive + var urlp = new URL(url) + var [meta, userSettings] = await Promise.all([ + archivesDb.getMeta(urlp.hostname), + archivesDb.getUserSettings(urlp.hostname) + ]) + if (!meta.isOwner) { + throw new Error('User dat is not owned by this device') + } + if (!userSettings.isSaved) { + throw new Error('User dat has been deleted') + } +} From 36e1f9e7397cebb902fa3d6202c00f85bc97185f Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 6 Dec 2018 21:55:49 -0600 Subject: [PATCH 004/245] Implement post and follows crawlers --- crawler/followgraph.js | 65 +++++++++++++++++++++---- crawler/index.js | 9 +++- crawler/posts.js | 85 ++++++++++++++++++++++++++++----- crawler/util.js | 4 ++ dbs/schemas/profile-data.sql.js | 13 ++--- package.json | 1 + users/index.js | 8 ++++ 7 files changed, 154 insertions(+), 31 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 6ccfab45..f75d7a44 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -1,11 +1,15 @@ +const assert = require('assert') +const _difference = require('lodash.difference') const Events = require('events') const db = require('../dbs/profile-data-db') -const {doCrawl} = require('./util') +const {doCrawl, doCheckpoint} = require('./util') // constants // = const TABLE_VERSION = 1 +const JSON_TYPE = 'unwalled.garden/follows' +const JSON_PATH = '/data/follows.json' // globals // = @@ -19,20 +23,61 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) -exports.crawlSite = async function (archive) { +exports.crawlSite = async function (archive, crawlSourceId) { return doCrawl(archive, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { + const supressEvents = resetRequired === true // dont emit 
when replaying old info if (resetRequired) { // reset all data - // TODO + await db.run(` + DELETE FROM crawl_followgraph WHERE crawlSourceId = ? + `, [crawlSourceId]) + await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSourceId, 0) } - // find files that need to be processed - // TODO + // did follows.json change? + var change = changes.find(c => c.path === JSON_PATH) + if (!change) { + return + } + + // read and validate + try { + var followsJson = JSON.parse(await archive.pda.readFile(JSON_PATH, 'utf8')) + assert(typeof followsJson === 'object', 'File be an object') + assert(followsJson.type === 'unwalled.garden/follows', 'JSON type must be unwalled.garden/follows') + assert(Array.isArray(followsJson.follows), 'JSON follows must be an array of strings') + followsJson.follows = followsJson.follows.filter(v => typeof v === 'string') + } catch (err) { + debug('Failed to read follows file', {url: archive.url, err}) + return + } + + // diff against the current follows + var currentFollows = await listFollows(archive) + var newFollows = followsJson.urls + var adds = _difference(newFollows, currentFollows) + var removes = _difference(currentFollows, newFollows) + + // write updates + for (let add of adds) { + await db.run(` + INSERT INTO crawl_followgraph (crawlSourceId, destUrl, crawledAt) VALUES (?, ?, ?) + `, [crawlSourceId, add, Date.now()]) + if (!supressEvents) { + events.emit('follow-added', archive.url, add) + } + } + for (let remove of removes) { + await db.run(` + DELETE FROM crawl_followgraph WHERE crawlSourceId = ? AND destUrl = ? + `, [crawlSourceId, remove]) + if (supressEvents) { + events.emit('follow-removed', archive.url, add) + } + } - // process the files - // TODO - // events.emit('follow-added', sourceUrl, subjectUrl) - // events.emit('follow-removed', sourceUrl, subjectUrl) + // write checkpoint as success + await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSourceId, changes[changes.length - 1].version) }) } @@ -53,7 +98,7 @@ exports.listFollowers = async function (subject) { // List urls of sites that subject follows // - subject. String (URL). 
// - returns Array -exports.listFollows = async function (subject) { +const listFollows = exports.listFollows = async function (subject) { var rows = await db.all(` SELECT crawl_followgraph.destUrl FROM crawl_followgraph diff --git a/crawler/index.js b/crawler/index.js index f87825f3..01ce5de9 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -52,9 +52,14 @@ exports.unwatchSite = async function (url) { async function crawlSite (archive) { var release = await lock('crawl:' + archive.url) try { + // insert crawl source + // TODO + var crawlSourceId = // TODO + + // crawl individual sources await Promise.all([ - posts.crawlSite(archive), - followgraph.crawlSite(archive) + posts.crawlSite(archive, crawlSourceId), + followgraph.crawlSite(archive, crawlSourceId) ]) } finally { release() diff --git a/crawler/posts.js b/crawler/posts.js index 07479d75..a1eed7da 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -8,6 +8,8 @@ const {doCrawl} = require('./util') // = const TABLE_VERSION = 1 +const JSON_TYPE = 'unwalled.garden/post' +const JSON_PATH_REGEX = /^\/data\/posts\/([^\/]+)\.json$/i // globals // = @@ -21,21 +23,82 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) -exports.crawlSite = async function (archive) { +exports.crawlSite = async function (archive, crawlSourceId) { return doCrawl(archive, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { + const supressEvents = resetRequired === true // dont emit when replaying old info if (resetRequired) { // reset all data - // TODO + await db.run(` + DELETE FROM crawl_posts WHERE crawlSourceId = ? + `, [crawlSourceId]) + await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSourceId, 0) } - // find files that need to be processed - // TODO - - // process the files - // TODO - // events.emit('post-added', sourceUrl) - // events.emit('post-updated', sourceUrl) - // events.emit('post-removed', sourceUrl) + // collect changed posts + var changedPosts = [] // order matters, must be oldest to newest + changes.forEach(c => { + if (JSON_PATH_REGEX.test(c.path)) { + let i = changedPosts.findIndex(c2 => c2.path === c.path) + if (i) { + changedPosts.splice(i, 1) // remove from old position + } + changedPosts.push(c) + } + }) + + // read and apply each post in order + for (let changedPost of changedPosts) { + // TODO Currently the crawler will abort reading the feed if any post fails to load + // this means that a single bad or unreachable file can stop the forward progress of post indexing + // to solve this, we need to find a way to tolerate bad post-files without losing our ability to efficiently detect new posts + // -prf + if (changedPost.type === 'del') { + // delete + await db.run(` + DELETE FROM crawl_posts WHERE crawlSourceId = ? AND pathname = ? 
+ `, [crawlSourceId, changedPost.path]) + events.emit('post-removed', archive.url) + } else { + // read and validate + let post + try { + post = JSON.parse(await archive.pda.readFile(changedPost.path, 'utf8')) + assert(typeof post === 'object', 'File be an object') + assert(post.type === 'unwalled.garden/post', 'JSON type must be unwalled.garden/post') + assert(typeof post.content === 'string', 'JSON content must be a string') + assert(typeof post.createdAt === 'string', 'JSON createdAt must be a date-time') + assert(!isNaN(Number(new Date(post.createdAt))), 'JSON createdAt must be a date-time') + } catch (err) { + debug('Failed to read post file', {url: archive.url, path: c.path, err}) + return // abort indexing + } + + // massage the post + post.createdAt = Number(new Date(post.createdAt)) + post.updatedAt = Number(new Date(post.updatedAt)) + if (isNaN(post.updatedAt)) post.updatedAt = 0 // value is optional + + // upsert + let existingPost = await get(archive.url, c.path) + if (existingPost) { + await db.run(` + UPDATE crawl_posts + SET crawledAt = ?, content = ?, createdAt = ?, updatedAt = ? + WHERE crawlSourceId = ? AND pathname = ? + `, [Date.now(), post.content, post.createdAt, post.updatedAt, crawlSourceId, changedPost.path]) + events.emit('post-updated', archive.url) + } else { + await db.run(` + INSERT INTO crawl_posts (crawlSourceId, pathname, crawledAt, content, createdAt, updatedAt) + VALUES (?, ?, ?, ?, ?, ?) + `, [crawlSourceId, changedPost.path, Date.now(), post.content, post.createdAt, post.updatedAt]) + events.emit('post-added', archive.url) + } + + // checkpoint our progress + await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSourceId, changedPost.version) + } + } }) } @@ -74,7 +137,7 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { return db.all(query, values) } -exports.get = async function (url, pathname = undefined) { +const get = exports.get = async function (url, pathname = undefined) { // validate & parse params if (url) { try { url = new URL(url) } diff --git a/crawler/util.js b/crawler/util.js index 303f25c0..59875905 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -42,4 +42,8 @@ exports.doCrawl = async function (archive, crawlDataset, crawlDatasetVersion, ha // upsert crawl state state.updatedAt = Date.now() // TODO +} + +exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion) { + // TODO } \ No newline at end of file diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 46cbd6a7..e323dfa6 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -121,13 +121,11 @@ CREATE TABLE crawl_sources_meta ( CREATE TABLE crawl_posts ( crawlSourceId INTEGER NOT NULL, pathname TEXT NOT NULL, + crawledAt INTEGER, - type TEXT NOT NULL, content TEXT, - - createdAt INTEGER DEFAULT (strftime('%s', 'now')), - updatedAt INTEGER DEFAULT (strftime('%s', 'now')), - crawledAt INTEGER DEFAULT (strftime('%s', 'now')), + createdAt INTEGER, + updatedAt INTEGER, FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); @@ -135,12 +133,11 @@ CREATE TABLE crawl_posts ( -- crawled follows CREATE TABLE crawl_followgraph ( crawlSourceId INTEGER NOT NULL, + crawledAt INTEGER, destUrl TEXT NOT NULL, - updatedAt INTEGER DEFAULT (strftime('%s', 'now')), - crawledAt INTEGER DEFAULT (strftime('%s', 'now')), - + PRIMARY KEY (crawlSourceId, destUrl), FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); diff 
--git a/package.json b/package.json index 9889a3bd..502fd75f 100644 --- a/package.json +++ b/package.json @@ -51,6 +51,7 @@ "identify-filetype": "^1.0.0", "into-stream": "^3.1.0", "lodash.debounce": "^4.0.8", + "lodash.difference": "^4.5.0", "lodash.get": "^4.4.2", "lodash.isequal": "^4.5.0", "lodash.pick": "^4.4.0", diff --git a/users/index.js b/users/index.js index da8b72b4..2fae2f61 100644 --- a/users/index.js +++ b/users/index.js @@ -5,6 +5,11 @@ const db = require('../dbs/profile-data-db') const archivesDb = require('../dbs/archives') const debug = require('../lib/debug-logger').debugLogger('users') +// constants +// = + +const SITE_TYPE = 'unwalled.garden/user' + // globals // = @@ -174,6 +179,9 @@ async function validateUserUrl (url) { if (!meta.isOwner) { throw new Error('User dat is not owned by this device') } + if (!meta.type.includes(SITE_TYPE)) { + throw new Error('User dat is not the correct type') + } if (!userSettings.isSaved) { throw new Error('User dat has been deleted') } From f592ca268630b201d7350922ee251d0885950f38 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 7 Dec 2018 20:32:35 -0600 Subject: [PATCH 005/245] Add write methods to crawler posts and followgraph --- crawler/followgraph.js | 76 ++++++++++++++++++++++++++++++++++-------- crawler/posts.js | 43 ++++++++++++++---------- crawler/util.js | 10 ++++++ 3 files changed, 98 insertions(+), 31 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index f75d7a44..742ebaef 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -1,8 +1,10 @@ const assert = require('assert') const _difference = require('lodash.difference') const Events = require('events') +const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') const {doCrawl, doCheckpoint} = require('./util') +const debug = require('../lib/debug-logger').debugLogger('crawler') // constants // = @@ -42,11 +44,7 @@ exports.crawlSite = async function (archive, crawlSourceId) { // read and validate try { - var followsJson = JSON.parse(await archive.pda.readFile(JSON_PATH, 'utf8')) - assert(typeof followsJson === 'object', 'File be an object') - assert(followsJson.type === 'unwalled.garden/follows', 'JSON type must be unwalled.garden/follows') - assert(Array.isArray(followsJson.follows), 'JSON follows must be an array of strings') - followsJson.follows = followsJson.follows.filter(v => typeof v === 'string') + var followsJson = await readFollowsFile(archive) } catch (err) { debug('Failed to read follows file', {url: archive.url, err}) return @@ -72,7 +70,7 @@ exports.crawlSite = async function (archive, crawlSourceId) { DELETE FROM crawl_followgraph WHERE crawlSourceId = ? AND destUrl = ? 
`, [crawlSourceId, remove]) if (supressEvents) { - events.emit('follow-removed', archive.url, add) + events.emit('follow-removed', archive.url, remove) } } @@ -125,16 +123,68 @@ exports.isAFollowingB = async function (a, b) { return !!res } -exports.follow = function () { - throw new Error('Not yet implemented') +exports.follow = function (archive, followUrl) { + // normalize followUrl + // TODO + assert(typeof followUrl === 'string', 'Follow() must be given a valid URL') + + return updateFollowsFile(archive, followsJson => { + if (!followsJson.urls.find(v => v === followUrl)) { + followsJson.urls.push(followUrl) + } + }) +} - // update the user dat +exports.unfollow = function (archive, followUrl) { + // normalize followUrl // TODO + assert(typeof followUrl === 'string', 'Unollow() must be given a valid URL') + + return updateFollowsFile(archive, followsJson => { + var i = followsJson.urls.findIndex(v => v === followUrl) + if (i !== -1) { + followsJson.urls.splice(i, 1) + } + }) +} + +// internal methods +// = + +async function readFollowsFile (archive) { + var followsJson = JSON.parse(await archive.pda.readFile(JSON_PATH, 'utf8')) + assert(typeof followsJson === 'object', 'File be an object') + assert(followsJson.type === JSON_TYPE, 'JSON type must be unwalled.garden/follows') + assert(Array.isArray(followsJson.follows), 'JSON follows must be an array of strings') + followsJson.follows = followsJson.follows.filter(v => typeof v === 'string') + return followsJson } -exports.unfollow = function () { - throw new Error('Not yet implemented') +async function updateFollowsFile (archive, updateFn) { + var release = await lock('crawler:followgraph:' + archive.url) + try { + // read the follows file + try { + var followsJson = await readFollowsFile(archive) + } catch (err) { + if (err.notFound) { + // create new + followsJson = { + type: JSON_TYPE, + urls: [] + } + } else { + debug('Failed to read follows file', {url: archive.url, err}) + throw err + } + } - // update the user dat - // TODO + // apply update + updateFn(followsJson) + + // write the follows file + await archive.pda.readFile(JSON_PATH, JSON.stringify(followsJson), 'utf8') + } finally { + release() + } } diff --git a/crawler/posts.js b/crawler/posts.js index a1eed7da..9c2818d1 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -2,7 +2,8 @@ const assert = require('assert') const {URL} = require('url') const Events = require('events') const db = require('../dbs/profile-data-db') -const {doCrawl} = require('./util') +const {doCrawl, doCheckpoint, generateTimeFilename} = require('./util') +const debug = require('../lib/debug-logger').debugLogger('crawler') // constants // = @@ -69,7 +70,7 @@ exports.crawlSite = async function (archive, crawlSourceId) { assert(typeof post.createdAt === 'string', 'JSON createdAt must be a date-time') assert(!isNaN(Number(new Date(post.createdAt))), 'JSON createdAt must be a date-time') } catch (err) { - debug('Failed to read post file', {url: archive.url, path: c.path, err}) + debug('Failed to read post file', {url: archive.url, path: changedPost.path, err}) return // abort indexing } @@ -79,7 +80,7 @@ exports.crawlSite = async function (archive, crawlSourceId) { if (isNaN(post.updatedAt)) post.updatedAt = 0 // value is optional // upsert - let existingPost = await get(archive.url, c.path) + let existingPost = await get(archive.url, changedPost.path) if (existingPost) { await db.run(` UPDATE crawl_posts @@ -158,23 +159,29 @@ const get = exports.get = async function (url, pathname = undefined) { `, 
[url.origin, pathname]) } -exports.create = async function () { - throw new Error('Not yet implemented') - - // update the user dat - // TODO +exports.create = async function (archive, {content} = {}) { + assert(typeof content === 'string', 'Create() must be provided a `content` string') + var filename = generateTimeFilename() + await archive.writeFile(`/posts/${filename}.json`, JSON.stringify({ + type: JSON_TYPE, + content, + createdAt: (new Date()).toISOString() + })) } -exports.edit = async function () { - throw new Error('Not yet implemented') - - // update the user dat - // TODO +exports.edit = async function (archive, pathname, {content} = {}) { + assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') + assert(typeof content === 'string', 'Edit() must be provided a `content` string') + var oldJson = JSON.parse(await archive.readFile(pathname)) + await archive.writeFile(pathname, JSON.stringify({ + type: JSON_TYPE, + content, + createdAt: oldJson.createdAt, + updatedAt: (new Date()).toISOString() + })) } -exports.delete = async function () { - throw new Error('Not yet implemented') - - // update the user dat - // TODO +exports.delete = async function (archive, pathname) { + assert(typeof pathname === 'string', 'Delete() must be provided a valid URL string') + await archive.unlink(pathname) } diff --git a/crawler/util.js b/crawler/util.js index 59875905..f201aeb2 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -46,4 +46,14 @@ exports.doCrawl = async function (archive, crawlDataset, crawlDatasetVersion, ha exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion) { // TODO +} + +var _lastGeneratedTimeFilename +exports.generateTimeFilename = function () { + var d = Date.now() + if (d === _lastGeneratedTimeFilename) { + d++ + } + _lastGeneratedTimeFilename = d + return (new Date(d)).toISOString() } \ No newline at end of file From bd112319b1839f0c356c26fdb256f6db94f9fa0e Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 15:21:35 -0600 Subject: [PATCH 006/245] Implement remaining crawler logic --- crawler/followgraph.js | 18 ++++++++++++++---- crawler/index.js | 10 +++++++--- crawler/posts.js | 4 ++-- crawler/util.js | 43 +++++++++++++++++++++--------------------- dbs/profile-data-db.js | 2 ++ 5 files changed, 46 insertions(+), 31 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 742ebaef..3d1b9421 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -1,6 +1,7 @@ const assert = require('assert') const _difference = require('lodash.difference') const Events = require('events') +const {Url} = require('url') const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') const {doCrawl, doCheckpoint} = require('./util') @@ -26,7 +27,7 @@ exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) exports.crawlSite = async function (archive, crawlSourceId) { - return doCrawl(archive, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { + return doCrawl(archive, crawlSourceId, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info if (resetRequired) { // reset all data @@ -125,7 +126,7 @@ exports.isAFollowingB = async function (a, b) { exports.follow = function (archive, followUrl) { // normalize followUrl - // TODO + followUrl = normalizeFollowUrl(followUrl) 
assert(typeof followUrl === 'string', 'Follow() must be given a valid URL') return updateFollowsFile(archive, followsJson => { @@ -137,8 +138,8 @@ exports.follow = function (archive, followUrl) { exports.unfollow = function (archive, followUrl) { // normalize followUrl - // TODO - assert(typeof followUrl === 'string', 'Unollow() must be given a valid URL') + followUrl = normalizeFollowUrl(followUrl) + assert(typeof followUrl === 'string', 'Unfollow() must be given a valid URL') return updateFollowsFile(archive, followsJson => { var i = followsJson.urls.findIndex(v => v === followUrl) @@ -151,6 +152,15 @@ exports.unfollow = function (archive, followUrl) { // internal methods // = +function normalizeFollowUrl (url) { + try { + url = new URL(url) + return url.origin + } catch (e) { + return null + } +} + async function readFollowsFile (archive) { var followsJson = JSON.parse(await archive.pda.readFile(JSON_PATH, 'utf8')) assert(typeof followsJson === 'object', 'File be an object') diff --git a/crawler/index.js b/crawler/index.js index 01ce5de9..2e20e7bb 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -1,5 +1,6 @@ const _throttle = require('lodash.throttle') const lock = require('../lib/lock') +const db = require('../dbs/profile-data-db') const users = require('../users') const dat = require('../dat') @@ -52,9 +53,12 @@ exports.unwatchSite = async function (url) { async function crawlSite (archive) { var release = await lock('crawl:' + archive.url) try { - // insert crawl source - // TODO - var crawlSourceId = // TODO + // get/create crawl source + var crawlSourceId = await db.run(`SELECT id FROM crawl_sources WHERE url = ?`, [archive.url]) + if (!crawlSourceId) { + await db.run(`INSERT INTO crawl_sources (url) VALUES (?)`, [archive.url]) + crawlSourceId = db.getSqliteInstance().lastID + } // crawl individual sources await Promise.all([ diff --git a/crawler/posts.js b/crawler/posts.js index 9c2818d1..dc797c9a 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -10,7 +10,7 @@ const debug = require('../lib/debug-logger').debugLogger('crawler') const TABLE_VERSION = 1 const JSON_TYPE = 'unwalled.garden/post' -const JSON_PATH_REGEX = /^\/data\/posts\/([^\/]+)\.json$/i +const JSON_PATH_REGEX = /^\/data\/posts\/([^/]+)\.json$/i // globals // = @@ -25,7 +25,7 @@ exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) exports.crawlSite = async function (archive, crawlSourceId) { - return doCrawl(archive, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { + return doCrawl(archive, crawlSourceId, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info if (resetRequired) { // reset all data diff --git a/crawler/util.js b/crawler/util.js index f201aeb2..8a7973fe 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -1,12 +1,15 @@ const db = require('../dbs/profile-data-db') +const dat = require('../dat') -exports.doCrawl = async function (archive, crawlDataset, crawlDatasetVersion, handlerFn) { +const READ_TIMEOUT = 30e3 + +exports.doCrawl = async function (archive, crawlSourceId, crawlDataset, crawlDatasetVersion, handlerFn) { const url = archive.url // fetch current crawl state var resetRequired = false var state = await db.get(` - SELECT crawl_sources_meta.* FROM crawl_sources_meta + SELECT crawl_sources_meta.crawlSourceVersion FROM crawl_sources_meta INNER JOIN crawl_sources ON crawl_sources.url = ? 
WHERE crawl_sources_meta.crawlDataset = ? `, [url, crawlDataset]) @@ -15,37 +18,33 @@ exports.doCrawl = async function (archive, crawlDataset, crawlDatasetVersion, ha state = null } if (!state) { - // new state - state = { - crawlSourceId: null, - url, - crawlDataset, - crawlDatasetVersion, - updatedAt: 0 - } + state = {crawlSourceVersion: 0} } // fetch current archive version - // TODO + var archiveInfo = await dat.library.getDaemon().getArchiveInfo(archive.key) + var version = archiveInfo ? archiveInfo.version : 0 // fetch change log - var changes = [] // TODO + var start = state.crawlSourceVersion + var end = version + var changes = await new Promise((resolve, reject) => { + archive.history({start, end, timeout: READ_TIMEOUT}, (err, c) => { + if (err) reject(err) + else resolve(c) + }) + }) // handle changes await handlerFn({changes, resetRequired}) - - if (!state.crawlSourceId) { - // upsert crawl source - // TODO - } - - // upsert crawl state - state.updatedAt = Date.now() - // TODO } exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion) { - // TODO + await db.run(` + INSERT OR REPLACE + INTO crawl_sources_meta (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion, updatedAt) + VALUES (?, ?, ?, ?, ?) + `, [crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion, Date.now()]) } var _lastGeneratedTimeFilename diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index 59734685..677af760 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -44,6 +44,8 @@ exports.parallelize = function () { return db.parallelize() } +exports.getSqliteInstance = () => db + // internal methods // = From 8af6f4f0c76ca4392ddae5b05bf6fbb04ec6771c Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 15:46:59 -0600 Subject: [PATCH 007/245] Implement followgraph web api --- web-apis/bg.js | 4 +- web-apis/bg/followgraph.js | 66 ++++++++++++++++++++++ web-apis/fg/beaker.js | 5 +- web-apis/manifests/internal/followgraph.js | 5 +- 4 files changed, 74 insertions(+), 6 deletions(-) create mode 100644 web-apis/bg/followgraph.js diff --git a/web-apis/bg.js b/web-apis/bg.js index 6702b4cb..e3d16b38 100644 --- a/web-apis/bg.js +++ b/web-apis/bg.js @@ -19,8 +19,8 @@ const bookmarksAPI = require('./bg/bookmarks') const historyAPI = require('./bg/history') const sitedataAPI = require('../dbs/sitedata').WEBAPI const watchlistAPI = require('./bg/watchlist') -const postsAPI = require('../crawler/posts') -const followgraphAPI = require('../crawler/followgraph') +const postsAPI = require('./bg/posts') +const followgraphAPI = require('./bg/followgraph') // external manifests const datArchiveManifest = require('./manifests/external/dat-archive') diff --git a/web-apis/bg/followgraph.js b/web-apis/bg/followgraph.js new file mode 100644 index 00000000..e0d8b9de --- /dev/null +++ b/web-apis/bg/followgraph.js @@ -0,0 +1,66 @@ +const globals = require('../../globals') +const assert = require('assert') +const {Url} = require('url') +const {PermissionsError} = require('beaker-error-constants') +const dat = require('../../dat') +const followgraphCrawler = require('../../crawler/followgraph') + +// exported api +// = + +module.exports = { + + async listFollowers (url) { + url = normalizeFollowUrl(url) + assertString(url, 'Parameter one must be a URL') + return followgraphCrawler.listFollowers(url) + }, + + async listFollows (url) { + url = normalizeFollowUrl(url) + assertString(url, 'Parameter one must be a URL') + return 
followgraphCrawler.listFollows(url) + }, + + async isAFollowingB (a, b) { + a = normalizeFollowUrl(a) + b = normalizeFollowUrl(b) + assertString(a, 'Parameter one must be a URL') + assertString(b, 'Parameter two must be a URL') + return followgraphCrawler.isAFollowingB(a, b) + }, + + async follow (url) { + url = normalizeFollowUrl(url) + assertString(url, 'Parameter one must be a URL') + var userSession = globals.getUserSessionFor(this.sender) + if (!userSession) throw new Error('No active user session') + var userArchive = dat.library.getArchive(userSession.url) + return followgraphCrawler.follow(userArchive, url) + }, + + async unfollow (url) { + url = normalizeFollowUrl(url) + assertString(url, 'Parameter one must be a URL') + var userSession = globals.getUserSessionFor(this.sender) + if (!userSession) throw new Error('No active user session') + var userArchive = dat.library.getArchive(userSession.url) + return followgraphCrawler.follow(userArchive, url) + } +} + +// internal methods +// = + +function normalizeFollowUrl (url) { + try { + url = new URL(url) + return url.origin + } catch (e) { + return null + } +} + +function assertString (v, msg) { + assert(!!v && typeof v === 'string', msg) +} diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index f356c463..a2af512d 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -161,8 +161,9 @@ exports.setup = function (rpc) { beaker.posts.delete = postsRPC.delete // beaker.followgraph - beaker.followgraph.queryall = followgraphRPC.queryall - beaker.followgraph.query = followgraphRPC.query + beaker.followgraph.listFollowers = followgraphRPC.listFollowers + beaker.followgraph.listFollows = followgraphRPC.listFollows + beaker.followgraph.isAFollowingB = followgraphRPC.isAFollowingB beaker.followgraph.follow = followgraphRPC.follow beaker.followgraph.unfollow = followgraphRPC.unfollow } diff --git a/web-apis/manifests/internal/followgraph.js b/web-apis/manifests/internal/followgraph.js index 8c8549c8..2cb0fd6d 100644 --- a/web-apis/manifests/internal/followgraph.js +++ b/web-apis/manifests/internal/followgraph.js @@ -1,6 +1,7 @@ module.exports = { - queryAll: 'promise', - query: 'promise', + listFollowers: 'promise', + listFollows: 'promise', + isAFollowingB: 'promise', follow: 'promise', unfollow: 'promise' } \ No newline at end of file From cfd8a6ad9f3639212c045da7cac5af9f38ea8a39 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 16:09:46 -0600 Subject: [PATCH 008/245] Add posts web api --- web-apis/bg/posts.js | 54 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 54 insertions(+) create mode 100644 web-apis/bg/posts.js diff --git a/web-apis/bg/posts.js b/web-apis/bg/posts.js new file mode 100644 index 00000000..8be750c1 --- /dev/null +++ b/web-apis/bg/posts.js @@ -0,0 +1,54 @@ +const globals = require('../../globals') +const assert = require('assert') +const {Url} = require('url') +const {PermissionsError} = require('beaker-error-constants') +const dat = require('../../dat') +const postsCrawler = require('../../crawler/posts') + +// exported api +// = + +module.exports = { + + async list ({offset, limit, reverse, author} = {}) { + // validate & parse params + assert(!offset || typeof offset === 'number', 'Offset must be a number') + assert(!limit || typeof limit === 'number', 'Limit must be a number') + assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') + assert(!author || typeof author === 'string', 'Author must be a string') + if (author) { + try { author = new 
URL(author) } + catch (e) { throw new Error('Failed to parse author URL: ' + author) } + } + return postsCrawler.list({offset, limit, reverse, author}) + }, + + async get (origin, pathname = undefined) { + return postsCrawler.get(origin, pathname) + }, + + async create ({content} = {}) { + assert(typeof content === 'string', 'Create() must be provided a `content` string') + var userSession = globals.getUserSessionFor(this.sender) + if (!userSession) throw new Error('No active user session') + var userArchive = dat.library.getArchive(userSession.url) + return postsCrawler.create(userArchive, {content}) + }, + + async edit (pathname, {content} = {}) { + assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') + assert(typeof content === 'string', 'Edit() must be provided a `content` string') + var userSession = globals.getUserSessionFor(this.sender) + if (!userSession) throw new Error('No active user session') + var userArchive = dat.library.getArchive(userSession.url) + return postsCrawler.edit(userArchive, pathname, {content}) + }, + + async delete (pathname) { + assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') + var userSession = globals.getUserSessionFor(this.sender) + if (!userSession) throw new Error('No active user session') + var userArchive = dat.library.getArchive(userSession.url) + return postsCrawler.delete(userArchive, pathname) + } +} \ No newline at end of file From 1f22b4dfabfd3befc8d0104e4c6aab5c99695f71 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 16:15:37 -0600 Subject: [PATCH 009/245] Add crawler sqlite delta --- dbs/profile-data-db.js | 1 + dbs/schemas/profile-data.sql.js | 2 +- dbs/schemas/profile-data.v24.sql.js | 52 +++++++++++++++++++++++++++++ 3 files changed, 54 insertions(+), 1 deletion(-) create mode 100644 dbs/schemas/profile-data.v24.sql.js diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index 677af760..ada82a01 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -76,6 +76,7 @@ migrations = [ migration('profile-data.v21.sql'), migration('profile-data.v22.sql', {canFail: true}), // canFail for the same reason as v16, ffs migration('profile-data.v23.sql'), + migration('profile-data.v24.sql') ] function migration (file, opts = {}) { return cb => { diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index e323dfa6..8568a698 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -217,5 +217,5 @@ INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Report an issu INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Explore the p2p Web', 'dat://taravancil.com/explore-the-p2p-web.md', 1); INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Support Beaker', 'https://opencollective.com/beaker', 1); -PRAGMA user_version = 23; +PRAGMA user_version = 24; ` diff --git a/dbs/schemas/profile-data.v24.sql.js b/dbs/schemas/profile-data.v24.sql.js new file mode 100644 index 00000000..cc3653b8 --- /dev/null +++ b/dbs/schemas/profile-data.v24.sql.js @@ -0,0 +1,52 @@ +module.exports = ` + +CREATE TABLE users ( + id INTEGER PRIMARY KEY NOT NULL, + url TEXT, + isDefault INTEGER DEFAULT 0, + createdAt INTEGER +); + +-- list of sites being crawled +CREATE TABLE crawl_sources ( + id INTEGER PRIMARY KEY NOT NULL, + url TEXT NOT NULL +); + +-- tracking information on the crawl-state of the sources +CREATE TABLE crawl_sources_meta ( + crawlSourceId INTEGER NOT NULL, + crawlSourceVersion 
INTEGER NOT NULL, + crawlDataset TEXT NOT NULL, + crawlDatasetVersion INTEGER NOT NULL, + updatedAt INTEGER DEFAULT, + + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + +-- crawled posts +CREATE TABLE crawl_posts ( + crawlSourceId INTEGER NOT NULL, + pathname TEXT NOT NULL, + crawledAt INTEGER, + + content TEXT, + createdAt INTEGER, + updatedAt INTEGER, + + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + +-- crawled follows +CREATE TABLE crawl_followgraph ( + crawlSourceId INTEGER NOT NULL, + crawledAt INTEGER, + + destUrl TEXT NOT NULL, + + PRIMARY KEY (crawlSourceId, destUrl), + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + +PRAGMA user_version = 24; +` \ No newline at end of file From d7b3fa2a84eedabafe0f0824d589ee32968e3091 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 16:16:22 -0600 Subject: [PATCH 010/245] Add userSessionAPI interface --- README.md | 9 ++++++++- globals.js | 3 ++- index.js | 3 +++ web-apis/bg/followgraph.js | 4 ++-- web-apis/bg/posts.js | 6 +++--- 5 files changed, 18 insertions(+), 7 deletions(-) diff --git a/README.md b/README.md index df6f1065..65436571 100644 --- a/README.md +++ b/README.md @@ -43,7 +43,10 @@ await beakerCore.setup({ exportAPI(apiName, apiManifest, apiImpl, [guardFn]) }, downloadsWebAPI: {...}, - browserWebAPI: {...} + browserWebAPI: {...}, + userSessionAPI: { + getFor(webContents) {/*...*/} + } }) // setup the protocol handler @@ -115,6 +118,10 @@ debug('dat-related stuff') ### `dat.debug` +### `crawler` + +### `users` + ## API (@beaker/core/webview) ### `setup()` \ No newline at end of file diff --git a/globals.js b/globals.js index 31516b70..a76cda47 100644 --- a/globals.js +++ b/globals.js @@ -10,5 +10,6 @@ module.exports = { uiAPI: null, rpcAPI: null, downloadsWebAPI: null, - browserWebAPI: null + browserWebAPI: null, + userSessionAPI: null } diff --git a/index.js b/index.js index 7f46ea90..28c92013 100644 --- a/index.js +++ b/index.js @@ -16,6 +16,8 @@ module.exports = { globals, dat, dbs, + crawler, + users, spellChecker, debugLogger: debugLogger.debugLogger, @@ -32,6 +34,7 @@ module.exports = { assert(!!opts.rpcAPI, 'must provide rpcAPI') assert(!!opts.downloadsWebAPI, 'must provide downloadsWebAPI') assert(!!opts.browserWebAPI, 'must provide browserWebAPI') + assert(!!opts.userSessionAPI, 'must provide userSessionAPI') for (let k in opts) { globals[k] = opts[k] diff --git a/web-apis/bg/followgraph.js b/web-apis/bg/followgraph.js index e0d8b9de..3ac7c14b 100644 --- a/web-apis/bg/followgraph.js +++ b/web-apis/bg/followgraph.js @@ -33,7 +33,7 @@ module.exports = { async follow (url) { url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') - var userSession = globals.getUserSessionFor(this.sender) + var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) return followgraphCrawler.follow(userArchive, url) @@ -42,7 +42,7 @@ module.exports = { async unfollow (url) { url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') - var userSession = globals.getUserSessionFor(this.sender) + var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) return followgraphCrawler.follow(userArchive, url) diff --git a/web-apis/bg/posts.js 
b/web-apis/bg/posts.js index 8be750c1..d7c5e623 100644 --- a/web-apis/bg/posts.js +++ b/web-apis/bg/posts.js @@ -29,7 +29,7 @@ module.exports = { async create ({content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') - var userSession = globals.getUserSessionFor(this.sender) + var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) return postsCrawler.create(userArchive, {content}) @@ -38,7 +38,7 @@ module.exports = { async edit (pathname, {content} = {}) { assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') assert(typeof content === 'string', 'Edit() must be provided a `content` string') - var userSession = globals.getUserSessionFor(this.sender) + var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) return postsCrawler.edit(userArchive, pathname, {content}) @@ -46,7 +46,7 @@ module.exports = { async delete (pathname) { assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') - var userSession = globals.getUserSessionFor(this.sender) + var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) return postsCrawler.delete(userArchive, pathname) From 3f3400bb357dd5d1be43239bea7419c409c43216 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 17:10:06 -0600 Subject: [PATCH 011/245] Add getUserSession/setUserSession to beaker.browser api --- web-apis/fg/beaker.js | 2 ++ web-apis/manifests/internal/browser.js | 3 +++ 2 files changed, 5 insertions(+) diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index a2af512d..213b4a2b 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -71,6 +71,8 @@ exports.setup = function (rpc) { beaker.browser.getInfo = beakerBrowserRPC.getInfo beaker.browser.checkForUpdates = beakerBrowserRPC.checkForUpdates beaker.browser.restartBrowser = beakerBrowserRPC.restartBrowser + beaker.browser.getUserSession = beakerBrowserRPC.getUserSession + beaker.browser.setUserSession = beakerBrowserRPC.setUserSession beaker.browser.getSetting = beakerBrowserRPC.getSetting beaker.browser.getSettings = beakerBrowserRPC.getSettings beaker.browser.setSetting = beakerBrowserRPC.setSetting diff --git a/web-apis/manifests/internal/browser.js b/web-apis/manifests/internal/browser.js index b14a1b0c..cd1c7743 100644 --- a/web-apis/manifests/internal/browser.js +++ b/web-apis/manifests/internal/browser.js @@ -4,6 +4,9 @@ module.exports = { checkForUpdates: 'promise', restartBrowser: 'sync', + getUserSession: 'promise', + setUserSession: 'promise', + getSettings: 'promise', getSetting: 'promise', setSetting: 'promise', From 1eb42a6a90e10ec76557db832154123a7434fdbb Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 18:53:52 -0600 Subject: [PATCH 012/245] Fixes --- dat/library.js | 1 + dat/watchlist.js | 3 +++ dbs/archives.js | 4 ++-- dbs/schemas/profile-data.sql.js | 2 +- dbs/schemas/profile-data.v24.sql.js | 2 +- package-lock.json | 15 ++++++--------- users/index.js | 4 ++-- web-apis/fg/beaker.js | 2 ++ 8 files changed, 18 insertions(+), 15 deletions(-) diff --git a/dat/library.js b/dat/library.js index 1cb63df5..3c0af69c 100644 --- a/dat/library.js +++ b/dat/library.js @@ -358,6 +358,7 
@@ exports.getActiveArchives = function getActiveArchives () { } const getOrLoadArchive = exports.getOrLoadArchive = async function getOrLoadArchive (key, opts) { + key = fromURLToKey(key) var archive = getArchive(key) if (archive) { return archive diff --git a/dat/watchlist.js b/dat/watchlist.js index f8814556..3c4bdc93 100644 --- a/dat/watchlist.js +++ b/dat/watchlist.js @@ -1,5 +1,6 @@ const EventEmitter = require('events') const emitStream = require('emit-stream') +const debug = require('../lib/debug-logger').debugLogger('datwatchlist') // dat modules const datLibrary = require('../dat/library') @@ -21,6 +22,8 @@ exports.setup = async function setup () { watch(site) } } catch (err) { + console.error(err) + debug('Error while loading watchlist', err) throw new Error('Failed to load the watchlist') } } diff --git a/dbs/archives.js b/dbs/archives.js index a14783cc..99977b5e 100644 --- a/dbs/archives.js +++ b/dbs/archives.js @@ -228,7 +228,7 @@ exports.touch = async function (key, timeVar = 'lastAccessTime', value = -1) { // - supresses a not-found with an empty object const getUserSettings = exports.getUserSettings = async function (profileId, key) { // massage inputs - key = datEncoding.toStr(key) + key = typeof key !== 'string' ? datEncoding.toStr(key) : key // validate inputs if (!DAT_HASH_REGEX.test(key)) { @@ -362,7 +362,7 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { // - supresses a not-found with an empty object const getMeta = exports.getMeta = async function (key) { // massage inputs - key = datEncoding.toStr(key) + key = typeof key !== 'string' ? datEncoding.toStr(key) : key // validate inputs if (!DAT_HASH_REGEX.test(key)) { diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 8568a698..6cb2e383 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -112,7 +112,7 @@ CREATE TABLE crawl_sources_meta ( crawlSourceVersion INTEGER NOT NULL, crawlDataset TEXT NOT NULL, crawlDatasetVersion INTEGER NOT NULL, - updatedAt INTEGER DEFAULT, + updatedAt INTEGER, FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); diff --git a/dbs/schemas/profile-data.v24.sql.js b/dbs/schemas/profile-data.v24.sql.js index cc3653b8..2f769b70 100644 --- a/dbs/schemas/profile-data.v24.sql.js +++ b/dbs/schemas/profile-data.v24.sql.js @@ -19,7 +19,7 @@ CREATE TABLE crawl_sources_meta ( crawlSourceVersion INTEGER NOT NULL, crawlDataset TEXT NOT NULL, crawlDatasetVersion INTEGER NOT NULL, - updatedAt INTEGER DEFAULT, + updatedAt INTEGER, FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); diff --git a/package-lock.json b/package-lock.json index 130e07fa..bd6543ca 100644 --- a/package-lock.json +++ b/package-lock.json @@ -2326,6 +2326,11 @@ "resolved": "https://registry.npmjs.org/lodash.debounce/-/lodash.debounce-4.0.8.tgz", "integrity": "sha1-gteb/zCmfEAF/9XiUVMArZyk168=" }, + "lodash.difference": { + "version": "4.5.0", + "resolved": "https://registry.npmjs.org/lodash.difference/-/lodash.difference-4.5.0.tgz", + "integrity": "sha1-nMtOUF1Ia5FlE0V3KIWi3yf9AXw=" + }, "lodash.get": { "version": "4.4.2", "resolved": "https://registry.npmjs.org/lodash.get/-/lodash.get-4.4.2.tgz", @@ -2361,15 +2366,7 @@ "dev": true, "requires": { "pseudomap": "^1.0.2", - "yallist": "^2.1.2" - }, - "dependencies": { - "yallist": { - "version": "2.1.2", - "resolved": "https://registry.npmjs.org/yallist/-/yallist-2.1.2.tgz", - "integrity": "sha1-HBH5IY8HYImkfdUS+TxmmaaoHVI=", - "dev": true - 
} + "yallist": "^3.0.2" } }, "map-age-cleaner": { diff --git a/users/index.js b/users/index.js index 2fae2f61..8e96a481 100644 --- a/users/index.js +++ b/users/index.js @@ -48,7 +48,7 @@ exports.setup = async function () { }) } -exports.getAll = async function () { +exports.list = async function () { return Promise.all(users.map(fetchUserInfo)) } @@ -174,7 +174,7 @@ async function validateUserUrl (url) { var urlp = new URL(url) var [meta, userSettings] = await Promise.all([ archivesDb.getMeta(urlp.hostname), - archivesDb.getUserSettings(urlp.hostname) + archivesDb.getUserSettings(0, urlp.hostname) ]) if (!meta.isOwner) { throw new Error('User dat is not owned by this device') diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 213b4a2b..b3d4de13 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -156,6 +156,7 @@ exports.setup = function (rpc) { beaker.watchlist.createEventsStream = () => fromEventStream(watchlistRPC.createEventsStream()) // beaker.posts + beaker.posts = {} beaker.posts.list = postsRPC.list beaker.posts.get = postsRPC.get beaker.posts.create = postsRPC.create @@ -163,6 +164,7 @@ exports.setup = function (rpc) { beaker.posts.delete = postsRPC.delete // beaker.followgraph + beaker.followgraph = {} beaker.followgraph.listFollowers = followgraphRPC.listFollowers beaker.followgraph.listFollows = followgraphRPC.listFollows beaker.followgraph.isAFollowingB = followgraphRPC.isAFollowingB From 99d71ec45d0761a5d834108c329f8396d13d0d78 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 8 Dec 2018 20:32:30 -0600 Subject: [PATCH 013/245] Fixes --- crawler/util.js | 2 +- dbs/archives.js | 2 +- users/index.js | 1 + 3 files changed, 3 insertions(+), 2 deletions(-) diff --git a/crawler/util.js b/crawler/util.js index 8a7973fe..60daffaa 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -13,7 +13,7 @@ exports.doCrawl = async function (archive, crawlSourceId, crawlDataset, crawlDat INNER JOIN crawl_sources ON crawl_sources.url = ? WHERE crawl_sources_meta.crawlDataset = ? `, [url, crawlDataset]) - if (state.crawlDatasetVersion !== crawlDatasetVersion) { + if (state && state.crawlDatasetVersion !== crawlDatasetVersion) { resetRequired = true state = null } diff --git a/dbs/archives.js b/dbs/archives.js index 99977b5e..85433822 100644 --- a/dbs/archives.js +++ b/dbs/archives.js @@ -278,7 +278,7 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { autoDownload: ('autoDownload' in newValues) ? newValues.autoDownload : newValues.isSaved, autoUpload: ('autoUpload' in newValues) ? newValues.autoUpload : newValues.isSaved, expiresAt: newValues.expiresAt, - localSyncPath: ('localSyncPath' in newValues) ? newValues.localSyncPath : '', + localSyncPath: (newValues.localSyncPath) ? newValues.localSyncPath : '', previewMode: ('previewMode' in newValues) ? 
newValues.previewMode : '' } let valueArray = [ diff --git a/users/index.js b/users/index.js index 8e96a481..e31b3024 100644 --- a/users/index.js +++ b/users/index.js @@ -85,6 +85,7 @@ exports.add = async function (url) { `INSERT INTO users (url, isDefault, createdAt) VALUES (?, ?, ?)`, [user.url, Number(user.isDefault), user.createdAt] ) + users.push(user) // fetch the user archive user.archive = await dat.library.getOrLoadArchive(user.url) From 462427dac182cf03986e7d782016d1e3ea74a01c Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 18:29:47 -0600 Subject: [PATCH 014/245] Fixes --- crawler/followgraph.js | 14 +++++++------- crawler/index.js | 19 ++++++++++++------- crawler/posts.js | 43 +++++++++++++++++++++++++----------------- crawler/util.js | 31 +++++++++++++++++------------- users/index.js | 2 ++ 5 files changed, 65 insertions(+), 44 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 3d1b9421..8d22d4b1 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -26,15 +26,15 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) -exports.crawlSite = async function (archive, crawlSourceId) { - return doCrawl(archive, crawlSourceId, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { +exports.crawlSite = async function (archive, crawlSource) { + return doCrawl(archive, crawlSource, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info if (resetRequired) { // reset all data await db.run(` DELETE FROM crawl_followgraph WHERE crawlSourceId = ? - `, [crawlSourceId]) - await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSourceId, 0) + `, [crawlSource.id]) + await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSource, 0) } // did follows.json change? @@ -61,7 +61,7 @@ exports.crawlSite = async function (archive, crawlSourceId) { for (let add of adds) { await db.run(` INSERT INTO crawl_followgraph (crawlSourceId, destUrl, crawledAt) VALUES (?, ?, ?) - `, [crawlSourceId, add, Date.now()]) + `, [crawlSource.id, add, Date.now()]) if (!supressEvents) { events.emit('follow-added', archive.url, add) } @@ -69,14 +69,14 @@ exports.crawlSite = async function (archive, crawlSourceId) { for (let remove of removes) { await db.run(` DELETE FROM crawl_followgraph WHERE crawlSourceId = ? AND destUrl = ? 
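The adds and removes applied in this loop come from diffing the site's follows file against what is already indexed in crawl_followgraph. For reference, the sketch below shows the shape that readFollowsFile() accepts and that follow()/unfollow() rewrite (the file's location is the JSON_PATH constant, which sits outside this excerpt); the two dat URLs and the exampleFollows name are placeholders, and entries get normalized to origins (protocol + hostname) by toOrigin().

// Hypothetical follows file content, matching the assertions in readFollowsFile():
const exampleFollows = {
  type: 'unwalled.garden/follows',
  urls: [
    'dat://alice.example', // placeholder origins; any path component is stripped
    'dat://bob.example'
  ]
}
console.log(JSON.stringify(exampleFollows, null, 2))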
- `, [crawlSourceId, remove]) + `, [crawlSource.id, remove]) if (supressEvents) { events.emit('follow-removed', archive.url, remove) } } // write checkpoint as success - await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSourceId, changes[changes.length - 1].version) + await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSource, changes[changes.length - 1].version) }) } diff --git a/crawler/index.js b/crawler/index.js index 2e20e7bb..004607a3 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -23,15 +23,19 @@ exports.setup = async function () { exports.watchSite = async function (archive) { if (typeof archive === 'string') { - archive = await dat.library.getOrLoadArchive() + archive = await dat.library.getOrLoadArchive(archive) } + console.log('watchSite', archive.url) if (!(archive.url in watches)) { const queueCrawl = _throttle(() => crawlSite(archive), 5e3) // watch for file changes - watches[archive.url] = archive.pda.watch() + watches[archive.url] = await archive.pda.watch() + watches[archive.url].on('error', console.error) + watches[archive.url].on('close', console.log.bind(console, 'close')) watches[archive.url].on('data', ([event, args]) => { + console.log('change event', archive.url, event, args) if (event === 'invalidated') { queueCrawl() } @@ -51,19 +55,20 @@ exports.unwatchSite = async function (url) { } async function crawlSite (archive) { + console.log('crawling', archive.url) var release = await lock('crawl:' + archive.url) try { // get/create crawl source - var crawlSourceId = await db.run(`SELECT id FROM crawl_sources WHERE url = ?`, [archive.url]) - if (!crawlSourceId) { + var crawlSource = await db.get(`SELECT id FROM crawl_sources WHERE url = ?`, [archive.url]) + if (!crawlSource) { await db.run(`INSERT INTO crawl_sources (url) VALUES (?)`, [archive.url]) - crawlSourceId = db.getSqliteInstance().lastID + crawlSource = {id: db.getSqliteInstance().lastID, url: archive.url} } // crawl individual sources await Promise.all([ - posts.crawlSite(archive, crawlSourceId), - followgraph.crawlSite(archive, crawlSourceId) + posts.crawlSite(archive, crawlSource), + followgraph.crawlSite(archive, crawlSource) ]) } finally { release() diff --git a/crawler/posts.js b/crawler/posts.js index dc797c9a..eda18370 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -24,28 +24,31 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) -exports.crawlSite = async function (archive, crawlSourceId) { - return doCrawl(archive, crawlSourceId, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { +exports.crawlSite = async function (archive, crawlSource) { + return doCrawl(archive, crawlSource, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info + console.log('Crawling posts for', archive.url, {changes, resetRequired}) if (resetRequired) { // reset all data + console.log('resetting data') await db.run(` DELETE FROM crawl_posts WHERE crawlSourceId = ? 
- `, [crawlSourceId]) - await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSourceId, 0) + `, [crawlSource.id]) + await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSource, 0) } // collect changed posts var changedPosts = [] // order matters, must be oldest to newest changes.forEach(c => { - if (JSON_PATH_REGEX.test(c.path)) { - let i = changedPosts.findIndex(c2 => c2.path === c.path) - if (i) { + if (JSON_PATH_REGEX.test(c.name)) { + let i = changedPosts.findIndex(c2 => c2.name === c.name) + if (i !== -1) { changedPosts.splice(i, 1) // remove from old position } changedPosts.push(c) } }) + console.log('collected changed posts', changedPosts) // read and apply each post in order for (let changedPost of changedPosts) { @@ -55,22 +58,24 @@ exports.crawlSite = async function (archive, crawlSourceId) { // -prf if (changedPost.type === 'del') { // delete + console.log('deleting', changedPost) await db.run(` DELETE FROM crawl_posts WHERE crawlSourceId = ? AND pathname = ? - `, [crawlSourceId, changedPost.path]) + `, [crawlSource.id, changedPost.name]) events.emit('post-removed', archive.url) } else { // read and validate + console.log('adding', changedPost) let post try { - post = JSON.parse(await archive.pda.readFile(changedPost.path, 'utf8')) + post = JSON.parse(await archive.pda.readFile(changedPost.name, 'utf8')) assert(typeof post === 'object', 'File be an object') assert(post.type === 'unwalled.garden/post', 'JSON type must be unwalled.garden/post') assert(typeof post.content === 'string', 'JSON content must be a string') assert(typeof post.createdAt === 'string', 'JSON createdAt must be a date-time') assert(!isNaN(Number(new Date(post.createdAt))), 'JSON createdAt must be a date-time') } catch (err) { - debug('Failed to read post file', {url: archive.url, path: changedPost.path, err}) + debug('Failed to read post file', {url: archive.url, name: changedPost.name, err}) return // abort indexing } @@ -80,25 +85,26 @@ exports.crawlSite = async function (archive, crawlSourceId) { if (isNaN(post.updatedAt)) post.updatedAt = 0 // value is optional // upsert - let existingPost = await get(archive.url, changedPost.path) + let existingPost = await get(archive.url, changedPost.name) if (existingPost) { await db.run(` UPDATE crawl_posts SET crawledAt = ?, content = ?, createdAt = ?, updatedAt = ? WHERE crawlSourceId = ? AND pathname = ? - `, [Date.now(), post.content, post.createdAt, post.updatedAt, crawlSourceId, changedPost.path]) + `, [Date.now(), post.content, post.createdAt, post.updatedAt, crawlSource.id, changedPost.name]) events.emit('post-updated', archive.url) } else { await db.run(` INSERT INTO crawl_posts (crawlSourceId, pathname, crawledAt, content, createdAt, updatedAt) VALUES (?, ?, ?, ?, ?, ?) 
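The assertions above pin down the on-disk shape of a post record, and create() further down in this patch writes exactly this shape under /data/posts/. A minimal sketch of a record that would pass the validation; the content string, the timestamp, and the examplePost name are placeholders, and an updatedAt date-time may additionally appear after an edit().

// Hypothetical contents of a /data/posts/<timestamp>.json file:
const examplePost = {
  type: 'unwalled.garden/post',
  content: 'hello, world',              // placeholder text
  createdAt: '2018-12-09T20:00:00.000Z' // placeholder ISO date-time
}
console.log(JSON.stringify(examplePost, null, 2))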
- `, [crawlSourceId, changedPost.path, Date.now(), post.content, post.createdAt, post.updatedAt]) + `, [crawlSource.id, changedPost.name, Date.now(), post.content, post.createdAt, post.updatedAt]) events.emit('post-added', archive.url) } // checkpoint our progress - await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSourceId, changedPost.version) + await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSource, changedPost.version) } + console.log('success', changedPost) } }) } @@ -115,10 +121,13 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { } // build query - var query = `SELECT crawl_posts.*, src.url AS crawlSourceUrl FROM crawl_posts` + var query = ` + SELECT crawl_posts.*, src.url AS crawlSourceUrl FROM crawl_posts + INNER JOIN crawl_sources src ON src.id = crawl_posts.crawlSourceId + ` var values = [] if (author) { - query += ` INNER JOIN crawl_sources src ON src.url = ?` + query += ` WHERE src.url = ?` values.push(author.origin) } if (offset) { @@ -162,7 +171,7 @@ const get = exports.get = async function (url, pathname = undefined) { exports.create = async function (archive, {content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() - await archive.writeFile(`/posts/${filename}.json`, JSON.stringify({ + await archive.writeFile(`/data/posts/${filename}.json`, JSON.stringify({ type: JSON_TYPE, content, createdAt: (new Date()).toISOString() diff --git a/crawler/util.js b/crawler/util.js index 60daffaa..cdb0e001 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -1,24 +1,26 @@ +const pump = require('pump') +const concat = require('concat-stream') const db = require('../dbs/profile-data-db') const dat = require('../dat') const READ_TIMEOUT = 30e3 -exports.doCrawl = async function (archive, crawlSourceId, crawlDataset, crawlDatasetVersion, handlerFn) { +exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatasetVersion, handlerFn) { const url = archive.url // fetch current crawl state var resetRequired = false var state = await db.get(` - SELECT crawl_sources_meta.crawlSourceVersion FROM crawl_sources_meta + SELECT meta.crawlSourceVersion, meta.crawlDatasetVersion FROM crawl_sources_meta meta INNER JOIN crawl_sources ON crawl_sources.url = ? - WHERE crawl_sources_meta.crawlDataset = ? + WHERE meta.crawlDataset = ? `, [url, crawlDataset]) if (state && state.crawlDatasetVersion !== crawlDatasetVersion) { resetRequired = true state = null } if (!state) { - state = {crawlSourceVersion: 0} + state = {crawlSourceVersion: 0, crawlDatasetVersion} } // fetch current archive version @@ -26,25 +28,28 @@ exports.doCrawl = async function (archive, crawlSourceId, crawlDataset, crawlDat var version = archiveInfo ? 
archiveInfo.version : 0 // fetch change log - var start = state.crawlSourceVersion - var end = version + var start = state.crawlSourceVersion + 1 + var end = version + 1 + console.log('fetching changes', start, end, state) var changes = await new Promise((resolve, reject) => { - archive.history({start, end, timeout: READ_TIMEOUT}, (err, c) => { - if (err) reject(err) - else resolve(c) - }) + pump( + archive.history({start, end, timeout: READ_TIMEOUT}), + concat({encoding: 'object'}, resolve), + reject + ) }) // handle changes await handlerFn({changes, resetRequired}) } -exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion) { +exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { + await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` - INSERT OR REPLACE + INSERT INTO crawl_sources_meta (crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion, updatedAt) VALUES (?, ?, ?, ?, ?) - `, [crawlDataset, crawlDatasetVersion, crawlSourceId, crawlSourceVersion, Date.now()]) + `, [crawlDataset, crawlDatasetVersion, crawlSource.id, crawlSourceVersion, Date.now()]) } var _lastGeneratedTimeFilename diff --git a/users/index.js b/users/index.js index e31b3024..2d05298b 100644 --- a/users/index.js +++ b/users/index.js @@ -30,6 +30,7 @@ exports.setup = async function () { // load the current users users = await db.all(`SELECT * FROM users`) + console.log('users loaded', users) users.forEach(async (user) => { // massage data user.archive = null @@ -81,6 +82,7 @@ exports.add = async function (url) { isDefault: users.length === 0, createdAt: Date.now() } + console.log('adding new user', user) await db.run( `INSERT INTO users (url, isDefault, createdAt) VALUES (?, ?, ?)`, [user.url, Number(user.isDefault), user.createdAt] From a79a5f600e7b0bfc76a3037b0a315835e43f25a1 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:05:32 -0600 Subject: [PATCH 015/245] Crawler fixes, particularly around the changes watcher --- crawler/followgraph.js | 6 +++++- crawler/index.js | 17 ++++++++++++----- crawler/posts.js | 18 ++++++++++-------- crawler/util.js | 2 +- 4 files changed, 28 insertions(+), 15 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 8d22d4b1..3ec2a7f5 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -4,6 +4,7 @@ const Events = require('events') const {Url} = require('url') const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') +const crawler = require('./index') const {doCrawl, doCheckpoint} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') @@ -193,7 +194,10 @@ async function updateFollowsFile (archive, updateFn) { updateFn(followsJson) // write the follows file - await archive.pda.readFile(JSON_PATH, JSON.stringify(followsJson), 'utf8') + await archive.pda.writeFile(JSON_PATH, JSON.stringify(followsJson), 'utf8') + + // trigger crawl now + await crawler.crawlSite(archive) } finally { release() } diff --git a/crawler/index.js b/crawler/index.js index 004607a3..586c1c0a 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -7,6 +7,8 @@ const dat = require('../dat') const posts = require('./posts') const followgraph = require('./followgraph') +const CRAWL_POLL_INTERVAL = 30e3 + // globals // = @@ -31,16 +33,20 @@ exports.watchSite = async function (archive) { const queueCrawl = 
_throttle(() => crawlSite(archive), 5e3) // watch for file changes - watches[archive.url] = await archive.pda.watch() - watches[archive.url].on('error', console.error) - watches[archive.url].on('close', console.log.bind(console, 'close')) + watches[archive.url] = archive.pda.watch() watches[archive.url].on('data', ([event, args]) => { - console.log('change event', archive.url, event, args) + console.log('MIRACLE ALERT! The crawler watch stream emitted a change event', archive.url, event, args) if (event === 'invalidated') { queueCrawl() } }) + // HACK + // for reasons that currently surpass me + // the `archive.pda.watch()` call is not currently working all the time + // so we need to poll sites for now + setInterval(queueCrawl, CRAWL_POLL_INTERVAL) + // run the first crawl crawlSite(archive) } @@ -54,7 +60,8 @@ exports.unwatchSite = async function (url) { } } -async function crawlSite (archive) { +const crawlSite = +exports.crawlSite = async function (archive) { console.log('crawling', archive.url) var release = await lock('crawl:' + archive.url) try { diff --git a/crawler/posts.js b/crawler/posts.js index eda18370..4401c2ee 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -2,6 +2,7 @@ const assert = require('assert') const {URL} = require('url') const Events = require('events') const db = require('../dbs/profile-data-db') +const crawler = require('./index') const {doCrawl, doCheckpoint, generateTimeFilename} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') @@ -30,7 +31,6 @@ exports.crawlSite = async function (archive, crawlSource) { console.log('Crawling posts for', archive.url, {changes, resetRequired}) if (resetRequired) { // reset all data - console.log('resetting data') await db.run(` DELETE FROM crawl_posts WHERE crawlSourceId = ? `, [crawlSource.id]) @@ -58,14 +58,12 @@ exports.crawlSite = async function (archive, crawlSource) { // -prf if (changedPost.type === 'del') { // delete - console.log('deleting', changedPost) await db.run(` DELETE FROM crawl_posts WHERE crawlSourceId = ? AND pathname = ? 
`, [crawlSource.id, changedPost.name]) events.emit('post-removed', archive.url) } else { // read and validate - console.log('adding', changedPost) let post try { post = JSON.parse(await archive.pda.readFile(changedPost.name, 'utf8')) @@ -104,7 +102,6 @@ exports.crawlSite = async function (archive, crawlSource) { // checkpoint our progress await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSource, changedPost.version) } - console.log('success', changedPost) } }) } @@ -171,26 +168,31 @@ const get = exports.get = async function (url, pathname = undefined) { exports.create = async function (archive, {content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() - await archive.writeFile(`/data/posts/${filename}.json`, JSON.stringify({ + console.log('writing file') + await archive.pda.writeFile(`/data/posts/${filename}.json`, JSON.stringify({ type: JSON_TYPE, content, createdAt: (new Date()).toISOString() })) + console.log('file written') + await crawler.crawlSite(archive) } exports.edit = async function (archive, pathname, {content} = {}) { assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') assert(typeof content === 'string', 'Edit() must be provided a `content` string') - var oldJson = JSON.parse(await archive.readFile(pathname)) - await archive.writeFile(pathname, JSON.stringify({ + var oldJson = JSON.parse(await archive.pda.readFile(pathname)) + await archive.pda.writeFile(pathname, JSON.stringify({ type: JSON_TYPE, content, createdAt: oldJson.createdAt, updatedAt: (new Date()).toISOString() })) + await crawler.crawlSite(archive) } exports.delete = async function (archive, pathname) { assert(typeof pathname === 'string', 'Delete() must be provided a valid URL string') - await archive.unlink(pathname) + await archive.pda.unlink(pathname) + await crawler.crawlSite(archive) } diff --git a/crawler/util.js b/crawler/util.js index cdb0e001..f16c018f 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -30,7 +30,7 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas // fetch change log var start = state.crawlSourceVersion + 1 var end = version + 1 - console.log('fetching changes', start, end, state) + console.log('fetching changes', archive.url, start, end, state) var changes = await new Promise((resolve, reject) => { pump( archive.history({start, end, timeout: READ_TIMEOUT}), From c08bcc36f4b951d05fdfd2ffdf6dbd18e6804e6e Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:21:43 -0600 Subject: [PATCH 016/245] Give better author info in posts responses --- crawler/posts.js | 18 +++++++++++++----- web-apis/bg/posts.js | 19 +++++++++++++++++-- 2 files changed, 30 insertions(+), 7 deletions(-) diff --git a/crawler/posts.js b/crawler/posts.js index 4401c2ee..b7235412 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -141,7 +141,7 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { } // execute query - return db.all(query, values) + return (await db.all(query, values)).map(massagePostRow) } const get = exports.get = async function (url, pathname = undefined) { @@ -153,7 +153,7 @@ const get = exports.get = async function (url, pathname = undefined) { pathname = pathname || url.pathname // execute query - return db.get(` + return massagePostRow(await db.get(` SELECT crawl_posts.*, src.url AS crawlSourceUrl FROM crawl_posts @@ -162,19 +162,17 @@ const get = exports.get = async function (url, pathname = undefined) { AND 
src.url = ? WHERE crawl_posts.pathname = ? - `, [url.origin, pathname]) + `, [url.origin, pathname])) } exports.create = async function (archive, {content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() - console.log('writing file') await archive.pda.writeFile(`/data/posts/${filename}.json`, JSON.stringify({ type: JSON_TYPE, content, createdAt: (new Date()).toISOString() })) - console.log('file written') await crawler.crawlSite(archive) } @@ -196,3 +194,13 @@ exports.delete = async function (archive, pathname) { await archive.pda.unlink(pathname) await crawler.crawlSite(archive) } + +// internal methods +// = + +function massagePostRow (row) { + row.author = {url: row.crawlSourceUrl} + delete row.crawlSourceUrl + delete row.crawlSourceId + return row +} diff --git a/web-apis/bg/posts.js b/web-apis/bg/posts.js index d7c5e623..02213262 100644 --- a/web-apis/bg/posts.js +++ b/web-apis/bg/posts.js @@ -3,6 +3,7 @@ const assert = require('assert') const {Url} = require('url') const {PermissionsError} = require('beaker-error-constants') const dat = require('../../dat') +const archivesDb = require('../../dbs/archives') const postsCrawler = require('../../crawler/posts') // exported api @@ -20,11 +21,17 @@ module.exports = { try { author = new URL(author) } catch (e) { throw new Error('Failed to parse author URL: ' + author) } } - return postsCrawler.list({offset, limit, reverse, author}) + var posts = await postsCrawler.list({offset, limit, reverse, author}) + await Promise.all(posts.map(async (post) => { + post.author.title = await getUserTitle(post.author) + })) + return posts }, async get (origin, pathname = undefined) { - return postsCrawler.get(origin, pathname) + var post = await postsCrawler.get(origin, pathname) + post.author.title = await getUserTitle(post.author) + return post }, async create ({content} = {}) { @@ -51,4 +58,12 @@ module.exports = { var userArchive = dat.library.getArchive(userSession.url) return postsCrawler.delete(userArchive, pathname) } +} + +// internal methods +// = + +async function getUserTitle (author) { + var meta = await archivesDb.getMeta(author.url.slice('dat://'.length)) + return meta ? 
meta.title : false } \ No newline at end of file From fc8a52a4e40a7b54b51d2903c5b7adadfaab5950 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:30:22 -0600 Subject: [PATCH 017/245] Correctly handle get() that doesnt have content --- crawler/posts.js | 1 + 1 file changed, 1 insertion(+) diff --git a/crawler/posts.js b/crawler/posts.js index b7235412..40f63e4c 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -199,6 +199,7 @@ exports.delete = async function (archive, pathname) { // = function massagePostRow (row) { + if (!row) return null row.author = {url: row.crawlSourceUrl} delete row.crawlSourceUrl delete row.crawlSourceId From 6252f9bced15e1fd2fe8e45b5291f30d8bdc1ff6 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:40:48 -0600 Subject: [PATCH 018/245] Normalize the URL provided by the users api --- users/index.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/users/index.js b/users/index.js index 2d05298b..3d672a84 100644 --- a/users/index.js +++ b/users/index.js @@ -164,7 +164,7 @@ async function fetchUserInfo (user) { var urlp = new URL(user.url) var meta = await archivesDb.getMeta(urlp.hostname) return { - url: user.url, + url: user.url.replace(/(\/)$/, ''), isDefault: user.isDefault, title: meta.title, description: meta.description, From 85c9f3c61997ce707449d8638e20cca5d5512955 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:45:38 -0600 Subject: [PATCH 019/245] More consistent URL normalization --- users/index.js | 13 +++++++++++-- 1 file changed, 11 insertions(+), 2 deletions(-) diff --git a/users/index.js b/users/index.js index 3d672a84..9f66b19c 100644 --- a/users/index.js +++ b/users/index.js @@ -33,6 +33,7 @@ exports.setup = async function () { console.log('users loaded', users) users.forEach(async (user) => { // massage data + user.url = normalizeUrl(user.url) user.archive = null user.isDefault = Boolean(user.isDefault) user.createdAt = new Date(user.createdAt) @@ -55,13 +56,15 @@ exports.list = async function () { const get = exports.get = async function (url) { + url = normalizeUrl(url) + console.log('getting user', url, users) var user = users.find(user => user.url === url) if (!user) return null return await fetchUserInfo(user) } const getDefault = -exports.getDefault = async function (url = undefined) { +exports.getDefault = async function () { var user = users.find(user => user.isDefault === true) if (!user) return null return await fetchUserInfo(user) @@ -69,6 +72,7 @@ exports.getDefault = async function (url = undefined) { exports.add = async function (url) { // make sure the user doesnt already exist + url = normalizeUrl(url) var existingUser = await get(url) if (existingUser) return @@ -96,6 +100,7 @@ exports.add = async function (url) { } exports.remove = async function (url) { + url = normalizeUrl(url) // get the user var user = await get(url) if (!user) return @@ -164,7 +169,7 @@ async function fetchUserInfo (user) { var urlp = new URL(user.url) var meta = await archivesDb.getMeta(urlp.hostname) return { - url: user.url.replace(/(\/)$/, ''), + url: normalizeUrl(user.url), isDefault: user.isDefault, title: meta.title, description: meta.description, @@ -172,6 +177,10 @@ async function fetchUserInfo (user) { } } +function normalizeUrl (url) { + return url ? 
url.replace(/(\/)$/, '') : url +} + async function validateUserUrl (url) { // make sure the archive is saved and that we own the archive var urlp = new URL(url) From b23ef93235dc6d0953425e5cfc1404042b46937c Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 9 Dec 2018 20:53:05 -0600 Subject: [PATCH 020/245] Create folders as needed --- crawler/posts.js | 7 +++++++ users/index.js | 1 - 2 files changed, 7 insertions(+), 1 deletion(-) diff --git a/crawler/posts.js b/crawler/posts.js index 40f63e4c..b516d149 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -168,6 +168,8 @@ const get = exports.get = async function (url, pathname = undefined) { exports.create = async function (archive, {content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() + await ensureDirectory(archive, '/data') + await ensureDirectory(archive, '/data/posts') await archive.pda.writeFile(`/data/posts/${filename}.json`, JSON.stringify({ type: JSON_TYPE, content, @@ -198,6 +200,11 @@ exports.delete = async function (archive, pathname) { // internal methods // = +async function ensureDirectory (archive, pathname) { + try { await archive.pda.mkdir(pathname) } + catch (e) { /* ignore */ } +} + function massagePostRow (row) { if (!row) return null row.author = {url: row.crawlSourceUrl} diff --git a/users/index.js b/users/index.js index 9f66b19c..b8e00e7f 100644 --- a/users/index.js +++ b/users/index.js @@ -57,7 +57,6 @@ exports.list = async function () { const get = exports.get = async function (url) { url = normalizeUrl(url) - console.log('getting user', url, users) var user = users.find(user => user.url === url) if (!user) return null return await fetchUserInfo(user) From e9b33ba46a8dc3f7c3c0e7d8fca98d0c5656cae1 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 11:46:46 -0600 Subject: [PATCH 021/245] Fixes --- crawler/followgraph.js | 2 +- web-apis/bg/followgraph.js | 9 ++++----- 2 files changed, 5 insertions(+), 6 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 3ec2a7f5..12b1dfa6 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -156,7 +156,7 @@ exports.unfollow = function (archive, followUrl) { function normalizeFollowUrl (url) { try { url = new URL(url) - return url.origin + return url.protocol + '//' + url.hostname } catch (e) { return null } diff --git a/web-apis/bg/followgraph.js b/web-apis/bg/followgraph.js index 3ac7c14b..4fee199d 100644 --- a/web-apis/bg/followgraph.js +++ b/web-apis/bg/followgraph.js @@ -45,7 +45,7 @@ module.exports = { var userSession = globals.userSessionAPI.getFor(this.sender) if (!userSession) throw new Error('No active user session') var userArchive = dat.library.getArchive(userSession.url) - return followgraphCrawler.follow(userArchive, url) + return followgraphCrawler.unfollow(userArchive, url) } } @@ -55,10 +55,9 @@ module.exports = { function normalizeFollowUrl (url) { try { url = new URL(url) - return url.origin - } catch (e) { - return null - } + return url.protocol + '//' + url.hostname + } catch (e) {} + return null } function assertString (v, msg) { From bc4bbbbe33128a1e5575a44f695e2140efe7feb9 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 12:10:35 -0600 Subject: [PATCH 022/245] Fixes to followgraph crawler --- crawler/followgraph.js | 18 +++++++++++++----- 1 file changed, 13 insertions(+), 5 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 12b1dfa6..87bf7d59 100644 --- 
a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -30,6 +30,7 @@ exports.removeListener = events.removeListener.bind(events) exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info + console.log('Crawling follows for', archive.url, {changes, resetRequired}) if (resetRequired) { // reset all data await db.run(` @@ -39,7 +40,7 @@ exports.crawlSite = async function (archive, crawlSource) { } // did follows.json change? - var change = changes.find(c => c.path === JSON_PATH) + var change = changes.find(c => c.name === JSON_PATH) if (!change) { return } @@ -48,12 +49,13 @@ exports.crawlSite = async function (archive, crawlSource) { try { var followsJson = await readFollowsFile(archive) } catch (err) { + console.error('Failed to read follows file', {url: archive.url, err}) debug('Failed to read follows file', {url: archive.url, err}) return } // diff against the current follows - var currentFollows = await listFollows(archive) + var currentFollows = await listFollows(archive.url) var newFollows = followsJson.urls var adds = _difference(newFollows, currentFollows) var removes = _difference(currentFollows, newFollows) @@ -163,11 +165,17 @@ function normalizeFollowUrl (url) { } async function readFollowsFile (archive) { - var followsJson = JSON.parse(await archive.pda.readFile(JSON_PATH, 'utf8')) + try { + var followsJson = await archive.pda.readFile(JSON_PATH, 'utf8') + } catch (e) { + if (e.notFound) return {urls: []} // empty default when not found + throw e + } + followsJson = JSON.parse(followsJson) assert(typeof followsJson === 'object', 'File be an object') assert(followsJson.type === JSON_TYPE, 'JSON type must be unwalled.garden/follows') - assert(Array.isArray(followsJson.follows), 'JSON follows must be an array of strings') - followsJson.follows = followsJson.follows.filter(v => typeof v === 'string') + assert(Array.isArray(followsJson.urls), 'JSON .urls must be an array of strings') + followsJson.urls = followsJson.urls.filter(v => typeof v === 'string') return followsJson } From 3495ba1e552be6434a084996a93a6b4b6f7acb18 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 12:11:11 -0600 Subject: [PATCH 023/245] Fixes to crawler --- crawler/index.js | 2 +- crawler/util.js | 7 +++---- 2 files changed, 4 insertions(+), 5 deletions(-) diff --git a/crawler/index.js b/crawler/index.js index 586c1c0a..1112ac64 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -66,7 +66,7 @@ exports.crawlSite = async function (archive) { var release = await lock('crawl:' + archive.url) try { // get/create crawl source - var crawlSource = await db.get(`SELECT id FROM crawl_sources WHERE url = ?`, [archive.url]) + var crawlSource = await db.get(`SELECT id, url FROM crawl_sources WHERE url = ?`, [archive.url]) if (!crawlSource) { await db.run(`INSERT INTO crawl_sources (url) VALUES (?)`, [archive.url]) crawlSource = {id: db.getSqliteInstance().lastID, url: archive.url} diff --git a/crawler/util.js b/crawler/util.js index f16c018f..02c008dc 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -11,10 +11,9 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas // fetch current crawl state var resetRequired = false var state = await db.get(` - SELECT meta.crawlSourceVersion, meta.crawlDatasetVersion FROM crawl_sources_meta meta - INNER JOIN crawl_sources ON 
crawl_sources.url = ? - WHERE meta.crawlDataset = ? - `, [url, crawlDataset]) + SELECT crawlSourceVersion, crawlDatasetVersion FROM crawl_sources_meta + WHERE crawlSourceId = ? AND crawlDataset = ? + `, [crawlSource.id, crawlDataset]) if (state && state.crawlDatasetVersion !== crawlDatasetVersion) { resetRequired = true state = null From 6b6dab7a8e416da28da2ede5d4db316815cfe227 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 12:33:32 -0600 Subject: [PATCH 024/245] Add authors param to beaker.posts.list --- crawler/posts.js | 26 ++++++++++++++++++++++---- web-apis/bg/posts.js | 9 +++------ web-apis/manifests/internal/users.js | 7 +++++++ 3 files changed, 32 insertions(+), 10 deletions(-) create mode 100644 web-apis/manifests/internal/users.js diff --git a/crawler/posts.js b/crawler/posts.js index b516d149..dc4c8f1f 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -106,15 +106,21 @@ exports.crawlSite = async function (archive, crawlSource) { }) } -exports.list = async function ({offset, limit, reverse, author} = {}) { +exports.list = async function ({offset, limit, reverse, author, authors} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') assert(!limit || typeof limit === 'number', 'Limit must be a number') assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') assert(!author || typeof author === 'string', 'Author must be a string') + assert(!authors || !Array.isArray(author), 'Authors must be an array of strings') + if (author) { - try { author = new URL(author) } - catch (e) { throw new Error('Failed to parse author URL: ' + author) } + try { author = toOrigin(author) } + catch (e) { throw new Error('Author must be a valid URL') } + } + if (authors) { + try { authors = authors.map(toOrigin) } + catch (e) { throw new Error('Authors array must contain valid URLs') } } // build query @@ -125,7 +131,14 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { var values = [] if (author) { query += ` WHERE src.url = ?` - values.push(author.origin) + values.push(author) + } else if (authors) { + let op = 'WHERE' + for (let author of authors) { + query += ` ${op} src.url = ?` + op = 'OR' + values.push(author) + } } if (offset) { query += ` OFFSET ?` @@ -200,6 +213,11 @@ exports.delete = async function (archive, pathname) { // internal methods // = +function toOrigin (url) { + url = new URL(url) + return url.protocol + '//' + url.hostname +} + async function ensureDirectory (archive, pathname) { try { await archive.pda.mkdir(pathname) } catch (e) { /* ignore */ } diff --git a/web-apis/bg/posts.js b/web-apis/bg/posts.js index 02213262..ee3eeca4 100644 --- a/web-apis/bg/posts.js +++ b/web-apis/bg/posts.js @@ -11,17 +11,14 @@ const postsCrawler = require('../../crawler/posts') module.exports = { - async list ({offset, limit, reverse, author} = {}) { + async list ({offset, limit, reverse, author, authors} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') assert(!limit || typeof limit === 'number', 'Limit must be a number') assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') assert(!author || typeof author === 'string', 'Author must be a string') - if (author) { - try { author = new URL(author) } - catch (e) { throw new Error('Failed to parse author URL: ' + author) } - } - var posts = await postsCrawler.list({offset, limit, reverse, author}) + assert(!authors || !Array.isArray(author), 'Authors 
must be an array of strings') + var posts = await postsCrawler.list({offset, limit, reverse, author, authors}) await Promise.all(posts.map(async (post) => { post.author.title = await getUserTitle(post.author) })) diff --git a/web-apis/manifests/internal/users.js b/web-apis/manifests/internal/users.js new file mode 100644 index 00000000..bdc4add0 --- /dev/null +++ b/web-apis/manifests/internal/users.js @@ -0,0 +1,7 @@ +module.exports = { + list: 'promise', + get: 'promise', + getDefault: 'promise', + add: 'promise', + remove: 'promise' +} From 1461a5f447a0ab2ef77583f22114adb3b1b3d7c2 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 12:55:26 -0600 Subject: [PATCH 025/245] More consistent URL normalization in followgraph --- crawler/followgraph.js | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 87bf7d59..b85c3808 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -94,7 +94,7 @@ exports.listFollowers = async function (subject) { ON crawl_followgraph.crawlSourceId = crawl_sources.id AND crawl_followgraph.destUrl = ? `, [subject]) - return rows.map(row => row.url) + return rows.map(row => toOrigin(row.url)) } // List urls of sites that subject follows @@ -108,7 +108,7 @@ const listFollows = exports.listFollows = async function (subject) { ON crawl_followgraph.crawlSourceId = crawl_sources.id AND crawl_sources.url = ? `, [subject]) - return rows.map(row => row.destUrl) + return rows.map(row => toOrigin(row.destUrl)) } // Check for the existence of an individual follow @@ -116,6 +116,8 @@ const listFollows = exports.listFollows = async function (subject) { // - b. String (URL), does a follow this site? // - returns bool exports.isAFollowingB = async function (a, b) { + a = toOrigin(a) + b = toOrigin(b) var res = await db.get(` SELECT crawl_sources.id FROM crawl_sources @@ -129,7 +131,7 @@ exports.isAFollowingB = async function (a, b) { exports.follow = function (archive, followUrl) { // normalize followUrl - followUrl = normalizeFollowUrl(followUrl) + followUrl = toOrigin(followUrl) assert(typeof followUrl === 'string', 'Follow() must be given a valid URL') return updateFollowsFile(archive, followsJson => { @@ -141,7 +143,7 @@ exports.follow = function (archive, followUrl) { exports.unfollow = function (archive, followUrl) { // normalize followUrl - followUrl = normalizeFollowUrl(followUrl) + followUrl = toOrigin(followUrl) assert(typeof followUrl === 'string', 'Unfollow() must be given a valid URL') return updateFollowsFile(archive, followsJson => { @@ -155,7 +157,7 @@ exports.unfollow = function (archive, followUrl) { // internal methods // = -function normalizeFollowUrl (url) { +function toOrigin (url) { try { url = new URL(url) return url.protocol + '//' + url.hostname @@ -175,7 +177,7 @@ async function readFollowsFile (archive) { assert(typeof followsJson === 'object', 'File be an object') assert(followsJson.type === JSON_TYPE, 'JSON type must be unwalled.garden/follows') assert(Array.isArray(followsJson.urls), 'JSON .urls must be an array of strings') - followsJson.urls = followsJson.urls.filter(v => typeof v === 'string') + followsJson.urls = followsJson.urls.filter(v => typeof v === 'string').map(toOrigin) return followsJson } From 2848a5241a2897e40425f0b86fa97463556d671d Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 12:55:52 -0600 Subject: [PATCH 026/245] Correctly get last ID of inserts --- crawler/index.js | 4 ++-- dbs/profile-data-db.js | 5 ++++- 
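The profile-data-db.js change in this patch leans on a node-sqlite3 detail: the run() callback exposes the insert id as this.lastID, so it has to be a regular function rather than an arrow, and crawler/index.js can then read res.lastID from the wrapped result. A standalone sketch of that behaviour, assuming only the sqlite3 npm package; the in-memory database and the example row are illustrative and not part of the patch:

const sqlite3 = require('sqlite3')
const demo = new sqlite3.Database(':memory:')
demo.serialize(() => {
  demo.run('CREATE TABLE crawl_sources (id INTEGER PRIMARY KEY NOT NULL, url TEXT NOT NULL)')
  demo.run('INSERT INTO crawl_sources (url) VALUES (?)', ['dat://example'], function (err) {
    if (err) throw err
    // `this` is the sqlite3 Statement; an arrow function would not see lastID here
    console.log(this.lastID) // -> 1
  })
})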
2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/crawler/index.js b/crawler/index.js index 1112ac64..3a7e5c08 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -68,8 +68,8 @@ exports.crawlSite = async function (archive) { // get/create crawl source var crawlSource = await db.get(`SELECT id, url FROM crawl_sources WHERE url = ?`, [archive.url]) if (!crawlSource) { - await db.run(`INSERT INTO crawl_sources (url) VALUES (?)`, [archive.url]) - crawlSource = {id: db.getSqliteInstance().lastID, url: archive.url} + let res = await db.run(`INSERT INTO crawl_sources (url) VALUES (?)`, [archive.url]) + crawlSource = {id: res.lastID, url: archive.url} } // crawl individual sources diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index ada82a01..a4c919b4 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -33,7 +33,10 @@ exports.all = async function (...args) { exports.run = async function (...args) { await setupPromise - return cbPromise(cb => db.run(...args, cb)) + return cbPromise(cb => db.run(...args, function (err) { + if (err) cb(err) + else cb(null, {lastID: this.lastID}) + })) } exports.serialize = function () { From b155908cba327e4caf1b78c12c591e47ccec40db Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 10 Dec 2018 16:09:06 -0600 Subject: [PATCH 027/245] Add readFile and showEditProfileModal to beaker.browser --- web-apis/fg/beaker.js | 2 ++ web-apis/manifests/internal/browser.js | 2 ++ 2 files changed, 4 insertions(+) diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index b3d4de13..4af45a67 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -73,6 +73,7 @@ exports.setup = function (rpc) { beaker.browser.restartBrowser = beakerBrowserRPC.restartBrowser beaker.browser.getUserSession = beakerBrowserRPC.getUserSession beaker.browser.setUserSession = beakerBrowserRPC.setUserSession + beaker.browser.showEditProfileModal = beakerBrowserRPC.showEditProfileModal beaker.browser.getSetting = beakerBrowserRPC.getSetting beaker.browser.getSettings = beakerBrowserRPC.getSettings beaker.browser.setSetting = beakerBrowserRPC.setSetting @@ -85,6 +86,7 @@ exports.setup = function (rpc) { beaker.browser.removeAsDefaultProtocolClient = beakerBrowserRPC.removeAsDefaultProtocolClient beaker.browser.fetchBody = beakerBrowserRPC.fetchBody beaker.browser.downloadURL = beakerBrowserRPC.downloadURL + beaker.browser.readFile = beakerBrowserRPC.readFile beaker.browser.getResourceContentType = beakerBrowserRPC.getResourceContentType beaker.browser.listBuiltinFavicons = beakerBrowserRPC.listBuiltinFavicons beaker.browser.getBuiltinFavicon = beakerBrowserRPC.getBuiltinFavicon diff --git a/web-apis/manifests/internal/browser.js b/web-apis/manifests/internal/browser.js index cd1c7743..6ffc0d7f 100644 --- a/web-apis/manifests/internal/browser.js +++ b/web-apis/manifests/internal/browser.js @@ -6,6 +6,7 @@ module.exports = { getUserSession: 'promise', setUserSession: 'promise', + showEditProfileModal: 'promise', getSettings: 'promise', getSetting: 'promise', @@ -25,6 +26,7 @@ module.exports = { fetchBody: 'promise', downloadURL: 'promise', + readFile: 'promise', getResourceContentType: 'sync', From 1ab95a6027bec1d86538198113880661a31dcdbe Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 13 Dec 2018 14:56:30 -0600 Subject: [PATCH 028/245] Fix first follow() --- crawler/followgraph.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index b85c3808..f8459d32 100644 --- 
a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -170,7 +170,7 @@ async function readFollowsFile (archive) { try { var followsJson = await archive.pda.readFile(JSON_PATH, 'utf8') } catch (e) { - if (e.notFound) return {urls: []} // empty default when not found + if (e.notFound) return {type: JSON_TYPE, urls: []} // empty default when not found throw e } followsJson = JSON.parse(followsJson) From f6c30ecd03256c8703c1c7078032ce2c924584a4 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 13 Dec 2018 14:57:59 -0600 Subject: [PATCH 029/245] Add site-descriptions to crawler --- crawler/followgraph.js | 62 ++++- crawler/index.js | 8 +- crawler/posts.js | 38 +-- crawler/site-descriptions.js | 303 +++++++++++++++++++++ crawler/util.js | 17 +- dbs/schemas/profile-data.sql.js | 16 ++ dbs/schemas/profile-data.v24.sql.js | 16 ++ web-apis/bg/followgraph.js | 14 +- web-apis/fg/beaker.js | 1 + web-apis/manifests/internal/followgraph.js | 1 + 10 files changed, 431 insertions(+), 45 deletions(-) create mode 100644 crawler/site-descriptions.js diff --git a/crawler/followgraph.js b/crawler/followgraph.js index f8459d32..f3403161 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -5,6 +5,7 @@ const {Url} = require('url') const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') const crawler = require('./index') +const siteDescriptions = require('./site-descriptions') const {doCrawl, doCheckpoint} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') @@ -83,10 +84,11 @@ exports.crawlSite = async function (archive, crawlSource) { }) } -// List urls of sites that follow subject +// List sites that follow subject // - subject. String (URL). -// - returns Array -exports.listFollowers = async function (subject) { +// - opts.includeDesc. Boolean. +// - returns Array +exports.listFollowers = async function (subject, {includeDesc} = {}) { var rows = await db.all(` SELECT crawl_sources.url FROM crawl_sources @@ -94,13 +96,22 @@ exports.listFollowers = async function (subject) { ON crawl_followgraph.crawlSourceId = crawl_sources.id AND crawl_followgraph.destUrl = ? `, [subject]) - return rows.map(row => toOrigin(row.url)) + if (!includeDesc) { + return rows.map(row => toOrigin(row.url)) + } + return Promise.all(rows.map(async (row) => { + var url = toOrigin(row.url) + var desc = await siteDescriptions.getBest({subject: url}) + desc.url = url + return desc + })) } -// List urls of sites that subject follows +// List sites that subject follows // - subject. String (URL). -// - returns Array -const listFollows = exports.listFollows = async function (subject) { +// - opts.includeDesc. Boolean. +// - returns Array +const listFollows = exports.listFollows = async function (subject, {includeDesc} = {}) { var rows = await db.all(` SELECT crawl_followgraph.destUrl FROM crawl_followgraph @@ -108,7 +119,29 @@ const listFollows = exports.listFollows = async function (subject) { ON crawl_followgraph.crawlSourceId = crawl_sources.id AND crawl_sources.url = ? `, [subject]) - return rows.map(row => toOrigin(row.destUrl)) + if (!includeDesc) { + return rows.map(row => toOrigin(row.destUrl)) + } + return Promise.all(rows.map(async (row) => { + var url = toOrigin(row.destUrl) + var desc = await siteDescriptions.getBest({subject: url, author: subject}) + desc.url = url + return desc + })) +} + +// List sites that are followed by sites that the subject follows +// - subject. String (URL). +// - opts.includeDesc. Boolean. 
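// A brief usage sketch (illustrative only — the dat URLs are placeholders, and the
// description fields are the ones produced by siteDescriptions.getBest()):
//   await listFollowers('dat://bob.com')                       // -> ['dat://alice.com', ...]
//   await listFollowers('dat://bob.com', {includeDesc: true})  // -> [{url, title, description, type, author}, ...]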
+// - returns Array +const listFoaFs = exports.listFoaFs = async function (subject, {includeDesc} = {}) { + var foafs = [] + var follows = await listFollows(subject) + for (let url of follows) { + foafs = foafs.concat(await listFollows(url, {includeDesc})) + } + // TODO remove duplicates + return foafs } // Check for the existence of an individual follow @@ -129,24 +162,29 @@ exports.isAFollowingB = async function (a, b) { return !!res } -exports.follow = function (archive, followUrl) { +exports.follow = async function (archive, followUrl) { // normalize followUrl followUrl = toOrigin(followUrl) assert(typeof followUrl === 'string', 'Follow() must be given a valid URL') - return updateFollowsFile(archive, followsJson => { + // write new follows.json + await updateFollowsFile(archive, followsJson => { if (!followsJson.urls.find(v => v === followUrl)) { followsJson.urls.push(followUrl) } }) + + // capture site description + /* dont await */siteDescriptions.capture(archive, followUrl) } -exports.unfollow = function (archive, followUrl) { +exports.unfollow = async function (archive, followUrl) { // normalize followUrl followUrl = toOrigin(followUrl) assert(typeof followUrl === 'string', 'Unfollow() must be given a valid URL') - return updateFollowsFile(archive, followsJson => { + // write new follows.json + await updateFollowsFile(archive, followsJson => { var i = followsJson.urls.findIndex(v => v === followUrl) if (i !== -1) { followsJson.urls.splice(i, 1) diff --git a/crawler/index.js b/crawler/index.js index 3a7e5c08..dd1a2ec4 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -6,6 +6,7 @@ const dat = require('../dat') const posts = require('./posts') const followgraph = require('./followgraph') +const siteDescriptions = require('./site-descriptions') const CRAWL_POLL_INTERVAL = 30e3 @@ -19,6 +20,7 @@ const watches = {} exports.posts = posts exports.followgraph = followgraph +exports.siteDescriptions = siteDescriptions exports.setup = async function () { } @@ -75,10 +77,10 @@ exports.crawlSite = async function (archive) { // crawl individual sources await Promise.all([ posts.crawlSite(archive, crawlSource), - followgraph.crawlSite(archive, crawlSource) + followgraph.crawlSite(archive, crawlSource), + siteDescriptions.crawlSite(archive, crawlSource) ]) } finally { release() } -} -exports.crawlSite = crawlSite \ No newline at end of file +} \ No newline at end of file diff --git a/crawler/posts.js b/crawler/posts.js index dc4c8f1f..8acefe9e 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -3,7 +3,7 @@ const {URL} = require('url') const Events = require('events') const db = require('../dbs/profile-data-db') const crawler = require('./index') -const {doCrawl, doCheckpoint, generateTimeFilename} = require('./util') +const {doCrawl, doCheckpoint, getMatchingChangesInOrder, generateTimeFilename} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') // constants @@ -38,16 +38,7 @@ exports.crawlSite = async function (archive, crawlSource) { } // collect changed posts - var changedPosts = [] // order matters, must be oldest to newest - changes.forEach(c => { - if (JSON_PATH_REGEX.test(c.name)) { - let i = changedPosts.findIndex(c2 => c2.name === c.name) - if (i !== -1) { - changedPosts.splice(i, 1) // remove from old position - } - changedPosts.push(c) - } - }) + var changedPosts = getMatchingChangesInOrder(changes, JSON_PATH_REGEX) console.log('collected changed posts', changedPosts) // read and apply each post in order @@ -106,21 +97,17 @@ 
exports.crawlSite = async function (archive, crawlSource) { }) } -exports.list = async function ({offset, limit, reverse, author, authors} = {}) { +exports.list = async function ({offset, limit, reverse, author} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') assert(!limit || typeof limit === 'number', 'Limit must be a number') assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') - assert(!author || typeof author === 'string', 'Author must be a string') - assert(!authors || !Array.isArray(author), 'Authors must be an array of strings') + assert(!author || typeof author === 'string' || (Array.isArray(author) && author.every(isString)), 'Author must be a string or an array of strings') if (author) { - try { author = toOrigin(author) } - catch (e) { throw new Error('Author must be a valid URL') } - } - if (authors) { - try { authors = authors.map(toOrigin) } - catch (e) { throw new Error('Authors array must contain valid URLs') } + author = Array.isArray(author) ? author : [author] + try { author = author.map(toOrigin) } + catch (e) { throw new Error('Author must contain valid URLs') } } // build query @@ -130,14 +117,11 @@ exports.list = async function ({offset, limit, reverse, author, authors} = {}) { ` var values = [] if (author) { - query += ` WHERE src.url = ?` - values.push(author) - } else if (authors) { let op = 'WHERE' - for (let author of authors) { + for (let a of author) { query += ` ${op} src.url = ?` op = 'OR' - values.push(author) + values.push(a) } } if (offset) { @@ -213,6 +197,10 @@ exports.delete = async function (archive, pathname) { // internal methods // = +function isString (v) { + return typeof v === 'string' +} + function toOrigin (url) { url = new URL(url) return url.protocol + '//' + url.hostname diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js new file mode 100644 index 00000000..90d5e925 --- /dev/null +++ b/crawler/site-descriptions.js @@ -0,0 +1,303 @@ +const assert = require('assert') +const {URL} = require('url') +const Events = require('events') +const _pick = require('lodash.pick') +const db = require('../dbs/profile-data-db') +const archivesDb = require('../dbs/archives') +const dat = require('../dat') +const crawler = require('./index') +const {doCrawl, doCheckpoint, getMatchingChangesInOrder, generateTimeFilename} = require('./util') +const debug = require('../lib/debug-logger').debugLogger('crawler') + +// constants +// = + +const TABLE_VERSION = 1 +const JSON_TYPE = 'unwalled.garden/site-description' +const JSON_PATH_REGEX = /^\/data\/known_sites\/([^/]+)\.json$/i + +// globals +// = + +var events = new Events() + +// exported api +// = + +exports.on = events.on.bind(events) +exports.addListener = events.addListener.bind(events) +exports.removeListener = events.removeListener.bind(events) + +exports.crawlSite = async function (archive, crawlSource) { + return doCrawl(archive, crawlSource, 'crawl_site_descriptions', TABLE_VERSION, async ({changes, resetRequired}) => { + const supressEvents = resetRequired === true // dont emit when replaying old info + console.log('Crawling site descriptions for', archive.url, {changes, resetRequired}) + if (resetRequired) { + // reset all data + await db.run(` + DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? 
+ `, [crawlSource.id]) + await doCheckpoint('crawl_site_descriptions', TABLE_VERSION, crawlSource, 0) + } + + // collect changed site descriptions + var changedSiteDescriptions = getMatchingChangesInOrder(changes, JSON_PATH_REGEX) + console.log('collected changed site descriptions', changedSiteDescriptions) + + // read and apply each post in order + for (let changedSiteDescription of changedSiteDescriptions) { + // TODO Currently the crawler will abort reading the feed if any description fails to load + // this means that a single bad or unreachable file can stop the forward progress of description indexing + // to solve this, we need to find a way to tolerate bad description-files without losing our ability to efficiently detect new posts + // -prf + if (changedSiteDescription.type === 'del') { + // delete + await db.run(` + DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND pathname = ? + `, [crawlSource.id, changedSiteDescription.name]) + events.emit('description-removed', archive.url) + } else { + // read and validate + let desc + try { + desc = JSON.parse(await archive.pda.readFile(changedSiteDescription.name, 'utf8')) + assert(typeof desc === 'object', 'File be an object') + assert(desc.type === 'unwalled.garden/site-description', 'JSON .type must be unwalled.garden/site-description') + assert(typeof desc.subject === 'string', 'JSON .subject must be a URL string') + try { let subject = new URL(desc.subject) } + catch (e) { throw new Error('JSON .subject must be a URL string') } + assert(desc.metadata && typeof desc.metadata === 'object', 'JSON .metadata must be object') + assert(typeof desc.createdAt === 'string', 'JSON .createdAt must be a date-time') + assert(!isNaN(Number(new Date(desc.createdAt))), 'JSON .createdAt must be a date-time') + } catch (err) { + debug('Failed to read site-description file', {url: archive.url, name: changedSiteDescription.name, err}) + return // abort indexing + } + + // massage the description + desc.subject = toOrigin(desc.subject) + desc.metadata.title = typeof desc.metadata.title === 'string' ? desc.metadata.title : '' + desc.metadata.description = typeof desc.metadata.description === 'string' ? desc.metadata.description : '' + if (typeof desc.metadata.type === 'string') desc.metadata.type = desc.metadata.type.split(',') + if (Array.isArray(desc.metadata.type)) { + desc.metadata.type = desc.metadata.type.filter(isString) + } else { + desc.metadata.type = [] + } + desc.createdAt = Number(new Date(desc.createdAt)) + + // replace + await db.run(` + DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND pathname = ? + `, [crawlSource.id, changedSiteDescription.name]) + await db.run(` + INSERT OR REPLACE INTO crawl_site_descriptions (crawlSourceId, pathname, crawledAt, subject, title, description, type, createdAt) + VALUES (?, ?, ?, ?, ?, ?, ?, ?) 
+ `, [crawlSource.id, changedSiteDescription.name, Date.now(), desc.subject, desc.metadata.title, desc.metadata.description, desc.metadata.type.join(','), desc.createdAt]) + events.emit('description-added', archive.url) + + // checkpoint our progress + await doCheckpoint('crawl_site_descriptions', TABLE_VERSION, crawlSource, changedSiteDescription.version) + } + } + }) +} + +const list = exports.list = async function ({offset, limit, reverse, author, subject} = {}) { + // validate & parse params + assert(!offset || typeof offset === 'number', 'Offset must be a number') + assert(!limit || typeof limit === 'number', 'Limit must be a number') + assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') + assert(!author || typeof author === 'string' || (Array.isArray(author) && author.every(isString)), 'Author must be a string or an array of strings') + assert(!subject || typeof subject === 'string' || (Array.isArray(subject) && subject.every(isString)), 'Subject must be a string or an array of strings') + + if (author) { + author = Array.isArray(author) ? author : [author] + try { author = author.map(toOrigin) } + catch (e) { throw new Error('Author must contain valid URLs') } + } + if (subject) { + subject = Array.isArray(subject) ? subject : [subject] + try { subject = subject.map(toOrigin) } + catch (e) { throw new Error('Subject must contain valid URLs') } + } + + // build query + var query = ` + SELECT crawl_site_descriptions.*, src.url AS crawlSourceUrl FROM crawl_site_descriptions + INNER JOIN crawl_sources src ON src.id = crawl_site_descriptions.crawlSourceId + ` + var values = [] + if (author) { + let op = 'WHERE' + for (let a of author) { + query += ` ${op} src.url = ?` + op = 'OR' + values.push(a) + } + } + if (subject) { + let op = 'WHERE' + for (let s of subject) { + query += ` ${op} subject = ?` + op = 'OR' + values.push(s) + } + } + if (offset) { + query += ` OFFSET ?` + values.push(offset) + } + if (limit) { + query += ` LIMIT ?` + values.push(limit) + } + query += ` ORDER BY createdAt` + if (reverse) { + query += ` DESC` + } + + // execute query + return (await db.all(query, values)).map(massageSiteDescriptionRow) +} + +exports.getBest = async function ({subject, author} = {}) { + // TODO + // while the archivesdb is more recent, it won't have the thumbnail + // -prf + // check archivesDb meta + // var meta = await archivesDb.getMeta(subject) + // if (meta) { + // return _pick(meta, ['title', 'description', 'type']) + // } + + // check for descriptions + console.log('getting best', subject, author) + var descriptions = await list({subject, author}) + return _pick(descriptions[0] || {}, ['title', 'description', 'type', 'author']) +} + +const get = exports.get = async function (url, pathname = undefined) { + // validate & parse params + if (url) { + try { url = new URL(url) } + catch (e) { throw new Error('Failed to parse post URL: ' + url) } + } + pathname = pathname || url.pathname + + // execute query + return massageSiteDescriptionRow(await db.get(` + SELECT + crawl_site_descriptions.*, src.url AS crawlSourceUrl + FROM crawl_site_descriptions + INNER JOIN crawl_sources src + ON src.id = crawl_site_descriptions.crawlSourceId + AND src.url = ? + WHERE + crawl_site_descriptions.pathname = ? 
+ `, [url.origin, pathname])) +} + +exports.capture = async function (archive, subjectArchive) { + if (typeof subjectArchive === 'string') { + subjectArchive = await dat.library.getOrLoadArchive(subjectArchive) + } + + // capture metadata + try { + var info = JSON.parse(await subjectArchive.pda.readFile('/dat.json')) + } catch (e) { + console.error('Failed to read dat.json of subject archive', e) + debug('Failed to read dat.json of subject archive', e) + throw new Error('Unabled to read subject dat.json') + } + await put(archive, { + subject: subjectArchive.url, + title: typeof info.title === 'string' ? info.title : undefined, + description: typeof info.description === 'string' ? info.description : undefined, + type: typeof info.type === 'string' || (Array.isArray(info.type) && info.type.every(isString)) ? info.type : undefined + }) + + // capture thumb + for (let ext of ['jpg', 'jpeg', 'png']) { + let thumbPath = `/thumb.${ext}` + if (await fileExists(subjectArchive, thumbPath)) { + let targetPath = `/data/known_sites/${toHostname(subjectArchive.url)}.${ext}` + await archive.pda.writeFile(targetPath, await subjectArchive.pda.readFile(thumbPath, 'binary'), 'binary') + break + } + } +} + +const put = +exports.put = async function (archive, {subject, title, description, type} = {}) { + assert(typeof subject === 'string', 'Put() must be provided a `subject` string') + try { + var subjectUrl = new URL(subject) + } catch (e) { + throw new Error('Put() `subject` must be a valid URL') + } + assert(!title || typeof title === 'string', 'Put() `title` must be a string') + assert(!description || typeof description === 'string', 'Put() `description` must be a string') + if (type) { + if (typeof type === 'string') type = type.split(',') + assert(Array.isArray(type), 'Put() `type` must be a string or an array of strings') + assert(type.every(isString), 'Put() `type` must be a string or an array of strings') + } + await ensureDirectory(archive, '/data') + await ensureDirectory(archive, '/data/known_sites') + await archive.pda.writeFile(`/data/known_sites/${subjectUrl.hostname}.json`, JSON.stringify({ + type: JSON_TYPE, + subject: subjectUrl.toString(), + metadata: { + title, + description, + type + }, + createdAt: (new Date()).toISOString() + })) + await crawler.crawlSite(archive) +} + +exports.delete = async function (archive, pathname) { + assert(typeof pathname === 'string', 'Delete() must be provided a valid URL string') + await archive.pda.unlink(pathname) + await crawler.crawlSite(archive) +} + +// internal methods +// = + +function isString (v) { + return typeof v === 'string' +} + +function toOrigin (url) { + url = new URL(url) + return url.protocol + '//' + url.hostname +} + +function toHostname (url) { + url = new URL(url) + return url.hostname +} + +async function ensureDirectory (archive, pathname) { + try { await archive.pda.mkdir(pathname) } + catch (e) { /* ignore */ } +} + +async function fileExists (archive, pathname) { + try { await archive.pda.stat(pathname) } + catch (e) { return false } + return true +} + +function massageSiteDescriptionRow (row) { + if (!row) return null + row.author = {url: row.crawlSourceUrl} + row.type = row.type && typeof row.type === 'string' ? 
row.type.split(',') : undefined + delete row.crawlSourceUrl + delete row.crawlSourceId + return row +} diff --git a/crawler/util.js b/crawler/util.js index 02c008dc..aa22556f 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -40,9 +40,12 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas // handle changes await handlerFn({changes, resetRequired}) + + // final checkpoint + await doCheckpoint(crawlDataset, crawlDatasetVersion, crawlSource, version) } -exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { +const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` INSERT @@ -51,6 +54,18 @@ exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlS `, [crawlDataset, crawlDatasetVersion, crawlSource.id, crawlSourceVersion, Date.now()]) } +exports.getMatchingChangesInOrder = function (changes, regex) { + var list = [] // order matters, must be oldest to newest + changes.forEach(c => { + if (regex.test(c.name)) { + let i = list.findIndex(c2 => c2.name === c.name) + if (i !== -1) list.splice(i, 1) // remove from old position + list.push(c) + } + }) + return list +} + var _lastGeneratedTimeFilename exports.generateTimeFilename = function () { var d = Date.now() diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 6cb2e383..a3305441 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -117,6 +117,22 @@ CREATE TABLE crawl_sources_meta ( FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +-- crawled descriptions of other sites +CREATE TABLE crawl_site_descriptions ( + crawlSourceId INTEGER NOT NULL, + pathname TEXT NOT NULL, + crawledAt INTEGER, + + subject TEXT, + title TEXT, + description TEXT, + type TEXT, -- comma separated strings + createdAt INTEGER, + + PRIMARY KEY (crawlSourceId, pathname), + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + -- crawled posts CREATE TABLE crawl_posts ( crawlSourceId INTEGER NOT NULL, diff --git a/dbs/schemas/profile-data.v24.sql.js b/dbs/schemas/profile-data.v24.sql.js index 2f769b70..e9b7bb71 100644 --- a/dbs/schemas/profile-data.v24.sql.js +++ b/dbs/schemas/profile-data.v24.sql.js @@ -24,6 +24,22 @@ CREATE TABLE crawl_sources_meta ( FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +-- crawled descriptions of other sites +CREATE TABLE crawl_site_descriptions ( + crawlSourceId INTEGER NOT NULL, + pathname TEXT NOT NULL, + crawledAt INTEGER, + + subject TEXT, + title TEXT, + description TEXT, + type TEXT, -- comma separated strings + createdAt INTEGER, + + PRIMARY KEY (crawlSourceId, pathname), + FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE +); + -- crawled posts CREATE TABLE crawl_posts ( crawlSourceId INTEGER NOT NULL, diff --git a/web-apis/bg/followgraph.js b/web-apis/bg/followgraph.js index 4fee199d..ba07c3d6 100644 --- a/web-apis/bg/followgraph.js +++ b/web-apis/bg/followgraph.js @@ -10,16 +10,22 @@ const followgraphCrawler = require('../../crawler/followgraph') module.exports = { - async listFollowers (url) { + async listFollowers (url, opts) { url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') - return 
followgraphCrawler.listFollowers(url) + return followgraphCrawler.listFollowers(url, opts) }, - async listFollows (url) { + async listFollows (url, opts) { url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') - return followgraphCrawler.listFollows(url) + return followgraphCrawler.listFollows(url, opts) + }, + + async listFoaFs (url, opts) { + url = normalizeFollowUrl(url) + assertString(url, 'Parameter one must be a URL') + return followgraphCrawler.listFoaFs(url, opts) }, async isAFollowingB (a, b) { diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 4af45a67..44511452 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -169,6 +169,7 @@ exports.setup = function (rpc) { beaker.followgraph = {} beaker.followgraph.listFollowers = followgraphRPC.listFollowers beaker.followgraph.listFollows = followgraphRPC.listFollows + beaker.followgraph.listFoaFs = followgraphRPC.listFoaFs beaker.followgraph.isAFollowingB = followgraphRPC.isAFollowingB beaker.followgraph.follow = followgraphRPC.follow beaker.followgraph.unfollow = followgraphRPC.unfollow diff --git a/web-apis/manifests/internal/followgraph.js b/web-apis/manifests/internal/followgraph.js index 2cb0fd6d..d4927e25 100644 --- a/web-apis/manifests/internal/followgraph.js +++ b/web-apis/manifests/internal/followgraph.js @@ -1,6 +1,7 @@ module.exports = { listFollowers: 'promise', listFollows: 'promise', + listFoaFs: 'promise', isAFollowingB: 'promise', follow: 'promise', unfollow: 'promise' From 041b7bc7eeb7526ab38d25ff9d56d32c69c01b04 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 13 Dec 2018 14:58:11 -0600 Subject: [PATCH 030/245] Add more export functions to daemon --- dat/daemon/index.js | 10 ++++++++++ dat/daemon/manifest.js | 2 ++ 2 files changed, 12 insertions(+) diff --git a/dat/daemon/index.js b/dat/daemon/index.js index 0aad5c42..4b25b8eb 100644 --- a/dat/daemon/index.js +++ b/dat/daemon/index.js @@ -331,6 +331,16 @@ const RPC_API = { configureAutoDownload(archive, userSettings) }, + async exportFilesystemToArchive (opts) { + opts.dstArchive = getArchive(opts.dstArchive) + return pda.exportFilesystemToArchive(opts) + }, + + async exportArchiveToFilesystem (opts) { + opts.srcArchive = getArchive(opts.srcArchive) + return pda.exportFilesystemToArchive(opts) + }, + async exportArchiveToArchive (opts) { opts.srcArchive = getArchive(opts.srcArchive) opts.dstArchive = getArchive(opts.dstArchive) diff --git a/dat/daemon/manifest.js b/dat/daemon/manifest.js index 327d4514..c926f07a 100644 --- a/dat/daemon/manifest.js +++ b/dat/daemon/manifest.js @@ -26,6 +26,8 @@ module.exports = { callArchivePDAPromiseMethod: 'promise', callArchivePDAReadStreamMethod: 'readable', clearFileCache: 'promise', + exportFilesystemToArchive: 'async', + exportArchiveToFilesystem: 'async', exportArchiveToArchive: 'async', // folder sync From d9e86aaf00d1393df2caa27b173397691adae641 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 13 Dec 2018 15:10:21 -0600 Subject: [PATCH 031/245] Fixes to the site-descriptions and FoaF algorithms --- crawler/followgraph.js | 16 ++++++++++++++-- crawler/site-descriptions.js | 25 ++++++++++++++++++------- 2 files changed, 32 insertions(+), 9 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index f3403161..13808de3 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -136,11 +136,23 @@ const listFollows = exports.listFollows = async function (subject, {includeDesc} // - returns Array const listFoaFs = exports.listFoaFs = async 
function (subject, {includeDesc} = {}) { var foafs = [] + // list URLs followed by subject var follows = await listFollows(subject) for (let url of follows) { - foafs = foafs.concat(await listFollows(url, {includeDesc})) + // list follows of this follow + for (let foaf of await listFollows(url, {includeDesc})) { + // ignore if followed by subject + if (follows.indexOf(foaf.url) !== -1) continue + // merge into list + let existingFoaF = foafs.find(v => v.url === foaf.url) + if (existingFoaF) { + existingFoaF.followedBy.push(url) + } else { + foaf.followedBy = [url] + foafs.push(foaf) + } + } } - // TODO remove duplicates return foafs } diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js index 90d5e925..7e9bb80d 100644 --- a/crawler/site-descriptions.js +++ b/crawler/site-descriptions.js @@ -128,21 +128,33 @@ const list = exports.list = async function ({offset, limit, reverse, author, sub INNER JOIN crawl_sources src ON src.id = crawl_site_descriptions.crawlSourceId ` var values = [] + + if (author || subject) { + query += ` WHERE ` + } + if (author) { - let op = 'WHERE' + query += `(` + let op = `` for (let a of author) { - query += ` ${op} src.url = ?` - op = 'OR' + query += `${op} src.url = ?` + op = ` OR` values.push(a) } + query += `) ` } if (subject) { - let op = 'WHERE' + if (author) { + query += ` AND ` + } + query += `(` + let op = `` for (let s of subject) { - query += ` ${op} subject = ?` - op = 'OR' + query += `${op} subject = ?` + op = ` OR` values.push(s) } + query += `) ` } if (offset) { query += ` OFFSET ?` @@ -172,7 +184,6 @@ exports.getBest = async function ({subject, author} = {}) { // } // check for descriptions - console.log('getting best', subject, author) var descriptions = await list({subject, author}) return _pick(descriptions[0] || {}, ['title', 'description', 'type', 'author']) } From bb4b16ae192788e1dbe02db34e4b06fa72199f87 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 13 Dec 2018 17:19:52 -0600 Subject: [PATCH 032/245] Add more options and data to followgraph list functions --- crawler/followgraph.js | 25 ++++++++++++++----------- 1 file changed, 14 insertions(+), 11 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 13808de3..cec6fecc 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -88,7 +88,7 @@ exports.crawlSite = async function (archive, crawlSource) { // - subject. String (URL). // - opts.includeDesc. Boolean. // - returns Array -exports.listFollowers = async function (subject, {includeDesc} = {}) { +const listFollowers = exports.listFollowers = async function (subject, {includeDesc} = {}) { var rows = await db.all(` SELECT crawl_sources.url FROM crawl_sources @@ -110,8 +110,9 @@ exports.listFollowers = async function (subject, {includeDesc} = {}) { // List sites that subject follows // - subject. String (URL). // - opts.includeDesc. Boolean. +// - opts.includeFollowers. Boolean. Requires includeDesc to be true. 
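// A brief usage sketch (illustrative only — the URL is a placeholder):
//   await listFollows('dat://alice.com', {includeDesc: true, includeFollowers: true})
//   // -> [{url, title, description, type, author, followedBy: [/* follower site descriptions */]}, ...]
// Note that includeFollowers only has an effect together with includeDesc, since the
// follower list is attached to the returned description objects.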
// - returns Array -const listFollows = exports.listFollows = async function (subject, {includeDesc} = {}) { +const listFollows = exports.listFollows = async function (subject, {includeDesc, includeFollowers} = {}) { var rows = await db.all(` SELECT crawl_followgraph.destUrl FROM crawl_followgraph @@ -126,29 +127,31 @@ const listFollows = exports.listFollows = async function (subject, {includeDesc} var url = toOrigin(row.destUrl) var desc = await siteDescriptions.getBest({subject: url, author: subject}) desc.url = url + if (includeFollowers) { + desc.followedBy = await listFollowers(url, {includeDesc: true}) + } return desc })) } // List sites that are followed by sites that the subject follows // - subject. String (URL). -// - opts.includeDesc. Boolean. -// - returns Array -const listFoaFs = exports.listFoaFs = async function (subject, {includeDesc} = {}) { +// - returns Array +const listFoaFs = exports.listFoaFs = async function (subject) { var foafs = [] // list URLs followed by subject - var follows = await listFollows(subject) - for (let url of follows) { + var follows = await listFollows(subject, {includeDesc: true}) + for (let follow of follows) { // list follows of this follow - for (let foaf of await listFollows(url, {includeDesc})) { + for (let foaf of await listFollows(follow.url, {includeDesc: true})) { // ignore if followed by subject - if (follows.indexOf(foaf.url) !== -1) continue + if (follows.find(v => v.url === foaf.url)) continue // merge into list let existingFoaF = foafs.find(v => v.url === foaf.url) if (existingFoaF) { - existingFoaF.followedBy.push(url) + existingFoaF.followedBy.push(follow) } else { - foaf.followedBy = [url] + foaf.followedBy = [follow] foafs.push(foaf) } } From 4ef0203b6f1828cd939209c818389289bdf043fc Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 14 Dec 2018 11:23:09 -0600 Subject: [PATCH 033/245] Bump deps --- package-lock.json | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/package-lock.json b/package-lock.json index bd6543ca..2133c6cc 100644 --- a/package-lock.json +++ b/package-lock.json @@ -2366,7 +2366,15 @@ "dev": true, "requires": { "pseudomap": "^1.0.2", - "yallist": "^3.0.2" + "yallist": "^2.1.2" + }, + "dependencies": { + "yallist": { + "version": "2.1.2", + "resolved": "https://registry.npmjs.org/yallist/-/yallist-2.1.2.tgz", + "integrity": "sha1-HBH5IY8HYImkfdUS+TxmmaaoHVI=", + "dev": true + } } }, "map-age-cleaner": { From e0caefe3b7a785c9b41364ed69101b4a26335577 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 14 Dec 2018 13:24:32 -0600 Subject: [PATCH 034/245] Add {followedBy} filter to followgraph --- crawler/followgraph.js | 59 +++++++++++++++++++++++++++----------- web-apis/bg/followgraph.js | 12 ++++++++ 2 files changed, 55 insertions(+), 16 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index cec6fecc..7fdaa958 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -63,9 +63,19 @@ exports.crawlSite = async function (archive, crawlSource) { // write updates for (let add of adds) { - await db.run(` - INSERT INTO crawl_followgraph (crawlSourceId, destUrl, crawledAt) VALUES (?, ?, ?) - `, [crawlSource.id, add, Date.now()]) + try { + await db.run(` + INSERT INTO crawl_followgraph (crawlSourceId, destUrl, crawledAt) VALUES (?, ?, ?) 
+ `, [crawlSource.id, add, Date.now()]) + } catch (e) { + if (e.code === 'SQLITE_CONSTRAINT') { + // uniqueness constraint probably failed, which means we got a duplicate somehow + // dont worry about it + debug('Attempted to insert duplicate followgraph record', {crawlSource, url: add}) + } else { + throw e + } + } if (!supressEvents) { events.emit('follow-added', archive.url, add) } @@ -86,16 +96,31 @@ exports.crawlSite = async function (archive, crawlSource) { // List sites that follow subject // - subject. String (URL). +// - opts.followedBy. String (URL). // - opts.includeDesc. Boolean. // - returns Array -const listFollowers = exports.listFollowers = async function (subject, {includeDesc} = {}) { - var rows = await db.all(` - SELECT crawl_sources.url - FROM crawl_sources - INNER JOIN crawl_followgraph - ON crawl_followgraph.crawlSourceId = crawl_sources.id - AND crawl_followgraph.destUrl = ? - `, [subject]) +const listFollowers = exports.listFollowers = async function (subject, {followedBy, includeDesc} = {}) { + var rows + if (followedBy) { + rows = await db.all(` + SELECT cs.url FROM crawl_followgraph fg + INNER JOIN crawl_sources cs ON cs.id = fg.crawlSourceId + WHERE fg.destUrl = ? + AND (cs.url = ? OR cs.url IN ( + SELECT destUrl as url FROM crawl_followgraph + INNER JOIN crawl_sources ON crawl_sources.id = crawl_followgraph.crawlSourceId + WHERE crawl_sources.url = ? + )) + `, [subject, followedBy, followedBy]) + } else { + rows = await db.all(` + SELECT f.url + FROM crawl_sources f + INNER JOIN crawl_followgraph + ON crawl_followgraph.crawlSourceId = f.id + AND crawl_followgraph.destUrl = ? + `, [subject]) + } if (!includeDesc) { return rows.map(row => toOrigin(row.url)) } @@ -109,10 +134,11 @@ const listFollowers = exports.listFollowers = async function (subject, {includeD // List sites that subject follows // - subject. String (URL). +// - opts.followedBy. String (URL). // - opts.includeDesc. Boolean. // - opts.includeFollowers. Boolean. Requires includeDesc to be true. // - returns Array -const listFollows = exports.listFollows = async function (subject, {includeDesc, includeFollowers} = {}) { +const listFollows = exports.listFollows = async function (subject, {followedBy, includeDesc, includeFollowers} = {}) { var rows = await db.all(` SELECT crawl_followgraph.destUrl FROM crawl_followgraph @@ -128,7 +154,7 @@ const listFollows = exports.listFollows = async function (subject, {includeDesc, var desc = await siteDescriptions.getBest({subject: url, author: subject}) desc.url = url if (includeFollowers) { - desc.followedBy = await listFollowers(url, {includeDesc: true}) + desc.followedBy = await listFollowers(url, {followedBy, includeDesc: true}) } return desc })) @@ -136,14 +162,15 @@ const listFollows = exports.listFollows = async function (subject, {includeDesc, // List sites that are followed by sites that the subject follows // - subject. String (URL). +// - opts.followedBy. String (URL). 
// - returns Array -const listFoaFs = exports.listFoaFs = async function (subject) { +const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {}) { var foafs = [] // list URLs followed by subject - var follows = await listFollows(subject, {includeDesc: true}) + var follows = await listFollows(subject, {followedBy, includeDesc: true}) for (let follow of follows) { // list follows of this follow - for (let foaf of await listFollows(follow.url, {includeDesc: true})) { + for (let foaf of await listFollows(follow.url, {followedBy, includeDesc: true})) { // ignore if followed by subject if (follows.find(v => v.url === foaf.url)) continue // merge into list diff --git a/web-apis/bg/followgraph.js b/web-apis/bg/followgraph.js index ba07c3d6..ad903df3 100644 --- a/web-apis/bg/followgraph.js +++ b/web-apis/bg/followgraph.js @@ -11,20 +11,32 @@ const followgraphCrawler = require('../../crawler/followgraph') module.exports = { async listFollowers (url, opts) { + opts = opts || {} url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') + var userSession = globals.userSessionAPI.getFor(this.sender) + if (!userSession) throw new Error('No active user session') + opts.followedBy = userSession.url return followgraphCrawler.listFollowers(url, opts) }, async listFollows (url, opts) { + opts = opts || {} url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') + var userSession = globals.userSessionAPI.getFor(this.sender) + if (!userSession) throw new Error('No active user session') + opts.followedBy = userSession.url return followgraphCrawler.listFollows(url, opts) }, async listFoaFs (url, opts) { + opts = opts || {} url = normalizeFollowUrl(url) assertString(url, 'Parameter one must be a URL') + var userSession = globals.userSessionAPI.getFor(this.sender) + if (!userSession) throw new Error('No active user session') + opts.followedBy = userSession.url return followgraphCrawler.listFoaFs(url, opts) }, From d9ed01292dff60c2ae2072ed48838428940df84e Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 14 Dec 2018 14:19:25 -0600 Subject: [PATCH 035/245] Add .followsUser output to followgraph queries --- crawler/followgraph.js | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 7fdaa958..9b8dbbc1 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -128,13 +128,16 @@ const listFollowers = exports.listFollowers = async function (subject, {followed var url = toOrigin(row.url) var desc = await siteDescriptions.getBest({subject: url}) desc.url = url + if (followedBy) { + desc.followsUser = await isAFollowingB(url, followedBy) + } return desc })) } // List sites that subject follows // - subject. String (URL). -// - opts.followedBy. String (URL). +// - opts.followedBy. String (URL). Filters to users who are followed by the URL specified. Causes .followsUser boolean to be set. // - opts.includeDesc. Boolean. // - opts.includeFollowers. Boolean. Requires includeDesc to be true. 
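// A brief consumption sketch (assumes the beaker.followgraph frontend bindings and the
// web-apis/bg/followgraph.js handler from the previous patch, which fills in followedBy
// from the active user session; the URL is a placeholder):
//   var follows = await beaker.followgraph.listFollows('dat://alice.com', {includeDesc: true})
//   follows.forEach(site => {
//     if (site.followsUser) console.log(site.title, 'follows the current user back')
//   })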
// - returns Array @@ -153,6 +156,9 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, var url = toOrigin(row.destUrl) var desc = await siteDescriptions.getBest({subject: url, author: subject}) desc.url = url + if (followedBy) { + desc.followsUser = await isAFollowingB(url, followedBy) + } if (includeFollowers) { desc.followedBy = await listFollowers(url, {followedBy, includeDesc: true}) } @@ -190,7 +196,7 @@ const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {} // - a. String (URL), the site being queried. // - b. String (URL), does a follow this site? // - returns bool -exports.isAFollowingB = async function (a, b) { +const isAFollowingB = exports.isAFollowingB = async function (a, b) { a = toOrigin(a) b = toOrigin(b) var res = await db.get(` From 9f534806a554e0050ac620903f247b26e9b9d176 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 15 Dec 2018 14:40:07 -0600 Subject: [PATCH 036/245] Filter out the subject from listFoaFs --- crawler/followgraph.js | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 9b8dbbc1..af32237a 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -168,7 +168,7 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, // List sites that are followed by sites that the subject follows // - subject. String (URL). -// - opts.followedBy. String (URL). +// - opts.followedBy. String (URL). Filters to users who are followed by the URL specified. Causes .followsUser boolean to be set. // - returns Array const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {}) { var foafs = [] @@ -177,7 +177,8 @@ const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {} for (let follow of follows) { // list follows of this follow for (let foaf of await listFollows(follow.url, {followedBy, includeDesc: true})) { - // ignore if followed by subject + // ignore if followed by subject or is subject + if (foaf.url === subject) continue if (follows.find(v => v.url === foaf.url)) continue // merge into list let existingFoaF = foafs.find(v => v.url === foaf.url) From 8581969097bc57906fbf55fad0c6ffb4712f9eac Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 15 Dec 2018 18:04:42 -0600 Subject: [PATCH 037/245] Add beaker.browser.showShellModal --- web-apis/fg/beaker.js | 1 + web-apis/manifests/internal/browser.js | 1 + 2 files changed, 2 insertions(+) diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 44511452..30a2fbe3 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -95,6 +95,7 @@ exports.setup = function (rpc) { beaker.browser.setWindowDimensions = beakerBrowserRPC.setWindowDimensions beaker.browser.showOpenDialog = beakerBrowserRPC.showOpenDialog beaker.browser.showContextMenu = beakerBrowserRPC.showContextMenu + beaker.browser.showShellModal = beakerBrowserRPC.showShellModal beaker.browser.openUrl = beakerBrowserRPC.openUrl beaker.browser.openFolder = beakerBrowserRPC.openFolder beaker.browser.doWebcontentsCmd = beakerBrowserRPC.doWebcontentsCmd diff --git a/web-apis/manifests/internal/browser.js b/web-apis/manifests/internal/browser.js index 6ffc0d7f..7eb661cb 100644 --- a/web-apis/manifests/internal/browser.js +++ b/web-apis/manifests/internal/browser.js @@ -33,6 +33,7 @@ module.exports = { setWindowDimensions: 'promise', showOpenDialog: 'promise', showContextMenu: 'promise', + showShellModal: 'promise', openUrl: 'promise', openFolder: 
'promise', doWebcontentsCmd: 'promise', From 78a3c7fb42289276de4113be2a92c911d58502a2 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 17 Dec 2018 16:21:22 -0600 Subject: [PATCH 038/245] Add beaker.crawler API --- crawler/index.js | 52 +++++++++++++++++++++++++- crawler/util.js | 9 +++++ web-apis/bg.js | 3 ++ web-apis/fg/beaker.js | 8 ++++ web-apis/manifests/internal/crawler.js | 5 +++ 5 files changed, 76 insertions(+), 1 deletion(-) create mode 100644 web-apis/manifests/internal/crawler.js diff --git a/crawler/index.js b/crawler/index.js index dd1a2ec4..ea9aa953 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -1,9 +1,13 @@ +const emitStream = require('emit-stream') +const {URL} = require('url') const _throttle = require('lodash.throttle') const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') +const archivesDb = require('../dbs/archives') const users = require('../users') const dat = require('../dat') +const {crawlerEvents} = require('./util') const posts = require('./posts') const followgraph = require('./followgraph') const siteDescriptions = require('./site-descriptions') @@ -21,6 +25,7 @@ const watches = {} exports.posts = posts exports.followgraph = followgraph exports.siteDescriptions = siteDescriptions +const createEventsStream = exports.createEventsStream = () => emitStream(crawlerEvents) exports.setup = async function () { } @@ -32,6 +37,7 @@ exports.watchSite = async function (archive) { console.log('watchSite', archive.url) if (!(archive.url in watches)) { + crawlerEvents.emit('watch', {sourceUrl: archive.url}) const queueCrawl = _throttle(() => crawlSite(archive), 5e3) // watch for file changes @@ -57,6 +63,7 @@ exports.watchSite = async function (archive) { exports.unwatchSite = async function (url) { // stop watching for file changes if (url in watches) { + crawlerEvents.emit('unwatch', {sourceUrl: url}) watches[url].close() watches[url] = null } @@ -65,6 +72,7 @@ exports.unwatchSite = async function (url) { const crawlSite = exports.crawlSite = async function (archive) { console.log('crawling', archive.url) + crawlerEvents.emit('crawl-start', {sourceUrl: archive.url}) var release = await lock('crawl:' + archive.url) try { // get/create crawl source @@ -80,7 +88,49 @@ exports.crawlSite = async function (archive) { followgraph.crawlSite(archive, crawlSource), siteDescriptions.crawlSite(archive, crawlSource) ]) + } catch (err) { + crawlerEvents.emit('crawl-error', {sourceUrl: archive.url, err: err.toString()}) } finally { + crawlerEvents.emit('crawl-finish', {sourceUrl: archive.url}) release() } -} \ No newline at end of file +} + +const getCrawlStates = +exports.getCrawlStates = async function () { + var rows = await db.all(` + SELECT + crawl_sources.url AS url, + GROUP_CONCAT(crawl_sources_meta.crawlSourceVersion) AS versions, + GROUP_CONCAT(crawl_sources_meta.crawlDataset) AS datasets, + MAX(crawl_sources_meta.updatedAt) AS updatedAt + FROM crawl_sources + INNER JOIN crawl_sources_meta ON crawl_sources_meta.crawlSourceId = crawl_sources.id + GROUP BY crawl_sources.id + `) + return Promise.all(rows.map(async ({url, versions, datasets, updatedAt}) => { + var datasetVersions = {} + versions = versions.split(',') + datasets = datasets.split(',') + for (let i = 0; i < datasets.length; i++) { + datasetVersions[datasets[i]] = Number(versions[i]) + } + var meta = await archivesDb.getMeta(toHostname(url)) + return {url, title: meta.title, datasetVersions, updatedAt} + })) +} + +const resetSite = +exports.resetSite = async function (url) { + 
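  // Note: deleting the crawl_sources row is enough to clear the derived crawl data,
  // assuming SQLite foreign-key enforcement is enabled (see the PRAGMA foreign_keys
  // change later in this series) — the crawl_* tables reference crawl_sources with
  // ON DELETE CASCADE in the profile-data schema.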
await db.run(`DELETE FROM crawl_sources WHERE url = ?`, [url]) +} + +exports.WEBAPI = {createEventsStream, getCrawlStates, resetSite} + +// internal methods +// = + +function toHostname (url) { + url = new URL(url) + return url.hostname +} diff --git a/crawler/util.js b/crawler/util.js index aa22556f..98c984a4 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -1,3 +1,4 @@ +const EventEmitter = require('events') const pump = require('pump') const concat = require('concat-stream') const db = require('../dbs/profile-data-db') @@ -5,6 +6,9 @@ const dat = require('../dat') const READ_TIMEOUT = 30e3 +const crawlerEvents = new EventEmitter() +exports.crawlerEvents = crawlerEvents + exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatasetVersion, handlerFn) { const url = archive.url @@ -38,14 +42,19 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas ) }) + crawlerEvents.emit('crawl-dataset-start', {sourceUrl: archive.url, crawlDataset, crawlRange: {start, end}}) + // handle changes await handlerFn({changes, resetRequired}) // final checkpoint await doCheckpoint(crawlDataset, crawlDatasetVersion, crawlSource, version) + + crawlerEvents.emit('crawl-dataset-finish', {sourceUrl: archive.url, crawlDataset, crawlRange: {start, end}}) } const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { + crawlerEvents.emit('crawl-dataset-progress', {sourceUrl: crawlSource.url, crawlDataset, crawledVersion: crawlSourceVersion}) await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` INSERT diff --git a/web-apis/bg.js b/web-apis/bg.js index e3d16b38..ac74937f 100644 --- a/web-apis/bg.js +++ b/web-apis/bg.js @@ -10,6 +10,7 @@ const downloadsManifest = require('./manifests/internal/downloads') const historyManifest = require('./manifests/internal/history') const sitedataManifest = require('./manifests/internal/sitedata') const watchlistManifest = require('./manifests/internal/watchlist') +const crawlerManifest = require('./manifests/internal/crawler') const postsManifest = require('./manifests/internal/posts') const followgraphManifest = require('./manifests/internal/followgraph') @@ -19,6 +20,7 @@ const bookmarksAPI = require('./bg/bookmarks') const historyAPI = require('./bg/history') const sitedataAPI = require('../dbs/sitedata').WEBAPI const watchlistAPI = require('./bg/watchlist') +const crawlerAPI = require('../crawler').WEBAPI const postsAPI = require('./bg/posts') const followgraphAPI = require('./bg/followgraph') @@ -54,6 +56,7 @@ exports.setup = function () { globals.rpcAPI.exportAPI('history', historyManifest, historyAPI, internalOnly) globals.rpcAPI.exportAPI('sitedata', sitedataManifest, sitedataAPI, internalOnly) globals.rpcAPI.exportAPI('watchlist', watchlistManifest, watchlistAPI, internalOnly) + globals.rpcAPI.exportAPI('crawler', crawlerManifest, crawlerAPI, internalOnly) globals.rpcAPI.exportAPI('posts', postsManifest, postsAPI, internalOnly) globals.rpcAPI.exportAPI('followgraph', followgraphManifest, followgraphAPI, internalOnly) diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 30a2fbe3..54ee141a 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -8,6 +8,7 @@ const downloadsManifest = require('../manifests/internal/downloads') const historyManifest = require('../manifests/internal/history') const sitedataManifest = 
require('../manifests/internal/sitedata') const watchlistManifest = require('../manifests/internal/watchlist') +const crawlerManifest = require('../manifests/internal/crawler') const postsManifest = require('../manifests/internal/posts') const followgraphManifest = require('../manifests/internal/followgraph') @@ -24,6 +25,7 @@ exports.setup = function (rpc) { const historyRPC = rpc.importAPI('history', historyManifest, opts) const sitedataRPC = rpc.importAPI('sitedata', sitedataManifest, opts) const watchlistRPC = rpc.importAPI('watchlist', watchlistManifest, opts) + const crawlerRPC = rpc.importAPI('crawler', crawlerManifest, opts) const postsRPC = rpc.importAPI('posts', postsManifest, opts) const followgraphRPC = rpc.importAPI('followgraph', followgraphManifest, opts) @@ -158,6 +160,12 @@ exports.setup = function (rpc) { beaker.watchlist.remove = watchlistRPC.remove beaker.watchlist.createEventsStream = () => fromEventStream(watchlistRPC.createEventsStream()) + // beaker.crawler + beaker.crawler = {} + beaker.crawler.getCrawlStates = crawlerRPC.getCrawlStates + beaker.crawler.resetSite = crawlerRPC.resetSite + beaker.crawler.createEventsStream = () => fromEventStream(crawlerRPC.createEventsStream()) + // beaker.posts beaker.posts = {} beaker.posts.list = postsRPC.list diff --git a/web-apis/manifests/internal/crawler.js b/web-apis/manifests/internal/crawler.js new file mode 100644 index 00000000..686ac47a --- /dev/null +++ b/web-apis/manifests/internal/crawler.js @@ -0,0 +1,5 @@ +module.exports = { + getCrawlStates: 'promise', + resetSite: 'promise', + createEventsStream: 'readable' +} From 2cdcd3d65d081dbb2294b1d047c8744d76bc691b Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Mon, 17 Dec 2018 18:59:15 -0600 Subject: [PATCH 039/245] Add beaker.crawler.crawlSite --- crawler/index.js | 10 +++++++++- web-apis/fg/beaker.js | 1 + web-apis/manifests/internal/crawler.js | 1 + 3 files changed, 11 insertions(+), 1 deletion(-) diff --git a/crawler/index.js b/crawler/index.js index ea9aa953..8e997cb2 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -125,7 +125,15 @@ exports.resetSite = async function (url) { await db.run(`DELETE FROM crawl_sources WHERE url = ?`, [url]) } -exports.WEBAPI = {createEventsStream, getCrawlStates, resetSite} +exports.WEBAPI = { + createEventsStream, + getCrawlStates, + crawlSite: async (url) => { + var archive = await dat.library.getOrLoadArchive(url) + return crawlSite(archive) + }, + resetSite +} // internal methods // = diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 54ee141a..81c420ad 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -163,6 +163,7 @@ exports.setup = function (rpc) { // beaker.crawler beaker.crawler = {} beaker.crawler.getCrawlStates = crawlerRPC.getCrawlStates + beaker.crawler.crawlSite = crawlerRPC.crawlSite beaker.crawler.resetSite = crawlerRPC.resetSite beaker.crawler.createEventsStream = () => fromEventStream(crawlerRPC.createEventsStream()) diff --git a/web-apis/manifests/internal/crawler.js b/web-apis/manifests/internal/crawler.js index 686ac47a..47365431 100644 --- a/web-apis/manifests/internal/crawler.js +++ b/web-apis/manifests/internal/crawler.js @@ -1,5 +1,6 @@ module.exports = { getCrawlStates: 'promise', + crawlSite: 'promise', resetSite: 'promise', createEventsStream: 'readable' } From 2d808973f006d81504f37d76d4f133cac1e270f1 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Tue, 18 Dec 2018 11:38:29 -0600 Subject: [PATCH 040/245] Enable foreign keys in sqlite --- lib/db.js | 7 +++++++ 1 file 
changed, 7 insertions(+) diff --git a/lib/db.js b/lib/db.js index 780e4956..94a4bf29 100644 --- a/lib/db.js +++ b/lib/db.js @@ -49,6 +49,13 @@ exports.makeSqliteTransactor = function (setupPromise) { // runs needed migrations, returns a promise exports.setupSqliteDB = function (db, {setup, migrations}, logTag) { return new Promise((resolve, reject) => { + // configure connection + db.run('PRAGMA foreign_keys = ON;', (err) => { + if (err) { + console.error('Failed to enable FK support in SQLite', err) + } + }) + // run migrations db.get('PRAGMA user_version;', (err, res) => { if (err) return reject(err) From c13cf914a6efea9cdf0d3fe5fffef7be48416a48 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Tue, 18 Dec 2018 11:38:41 -0600 Subject: [PATCH 041/245] Rework crawler progress events --- crawler/followgraph.js | 5 ++++- crawler/posts.js | 11 +++++++---- crawler/site-descriptions.js | 11 +++++++---- crawler/util.js | 6 +++++- 4 files changed, 23 insertions(+), 10 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index af32237a..0340117d 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -6,7 +6,7 @@ const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') const crawler = require('./index') const siteDescriptions = require('./site-descriptions') -const {doCrawl, doCheckpoint} = require('./util') +const {doCrawl, doCheckpoint, emitProgressEvent} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') // constants @@ -46,6 +46,8 @@ exports.crawlSite = async function (archive, crawlSource) { return } + emitProgressEvent(archive.url, 'crawl_followgraph', 0, 1) + // read and validate try { var followsJson = await readFollowsFile(archive) @@ -91,6 +93,7 @@ exports.crawlSite = async function (archive, crawlSource) { // write checkpoint as success await doCheckpoint('crawl_followgraph', TABLE_VERSION, crawlSource, changes[changes.length - 1].version) + emitProgressEvent(archive.url, 'crawl_followgraph', 1, 1) }) } diff --git a/crawler/posts.js b/crawler/posts.js index 8acefe9e..32db063a 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -3,7 +3,7 @@ const {URL} = require('url') const Events = require('events') const db = require('../dbs/profile-data-db') const crawler = require('./index') -const {doCrawl, doCheckpoint, getMatchingChangesInOrder, generateTimeFilename} = require('./util') +const {doCrawl, doCheckpoint, emitProgressEvent, getMatchingChangesInOrder, generateTimeFilename} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') // constants @@ -40,8 +40,10 @@ exports.crawlSite = async function (archive, crawlSource) { // collect changed posts var changedPosts = getMatchingChangesInOrder(changes, JSON_PATH_REGEX) console.log('collected changed posts', changedPosts) + emitProgressEvent(archive.url, 'crawl_posts', 0, changedPosts.length) // read and apply each post in order + var progress = 0 for (let changedPost of changedPosts) { // TODO Currently the crawler will abort reading the feed if any post fails to load // this means that a single bad or unreachable file can stop the forward progress of post indexing @@ -89,10 +91,11 @@ exports.crawlSite = async function (archive, crawlSource) { `, [crawlSource.id, changedPost.name, Date.now(), post.content, post.createdAt, post.updatedAt]) events.emit('post-added', archive.url) } - - // checkpoint our progress - await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSource, changedPost.version) } + + // checkpoint our 
progress + await doCheckpoint('crawl_posts', TABLE_VERSION, crawlSource, changedPost.version) + emitProgressEvent(archive.url, 'crawl_posts', ++progress, changedPosts.length) } }) } diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js index 7e9bb80d..d92ac1e4 100644 --- a/crawler/site-descriptions.js +++ b/crawler/site-descriptions.js @@ -6,7 +6,7 @@ const db = require('../dbs/profile-data-db') const archivesDb = require('../dbs/archives') const dat = require('../dat') const crawler = require('./index') -const {doCrawl, doCheckpoint, getMatchingChangesInOrder, generateTimeFilename} = require('./util') +const {doCrawl, doCheckpoint, emitProgressEvent, getMatchingChangesInOrder, generateTimeFilename} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') // constants @@ -43,8 +43,10 @@ exports.crawlSite = async function (archive, crawlSource) { // collect changed site descriptions var changedSiteDescriptions = getMatchingChangesInOrder(changes, JSON_PATH_REGEX) console.log('collected changed site descriptions', changedSiteDescriptions) + emitProgressEvent(archive.url, 'crawl_site_descriptions', 0, changedSiteDescriptions.length) // read and apply each post in order + var progress = 0 for (let changedSiteDescription of changedSiteDescriptions) { // TODO Currently the crawler will abort reading the feed if any description fails to load // this means that a single bad or unreachable file can stop the forward progress of description indexing @@ -95,10 +97,11 @@ exports.crawlSite = async function (archive, crawlSource) { VALUES (?, ?, ?, ?, ?, ?, ?, ?) `, [crawlSource.id, changedSiteDescription.name, Date.now(), desc.subject, desc.metadata.title, desc.metadata.description, desc.metadata.type.join(','), desc.createdAt]) events.emit('description-added', archive.url) - - // checkpoint our progress - await doCheckpoint('crawl_site_descriptions', TABLE_VERSION, crawlSource, changedSiteDescription.version) } + + // checkpoint our progress + await doCheckpoint('crawl_site_descriptions', TABLE_VERSION, crawlSource, changedSiteDescription.version) + emitProgressEvent(archive.url, 'crawl_site_descriptions', ++progress, changedSiteDescription.length) } }) } diff --git a/crawler/util.js b/crawler/util.js index 98c984a4..cbd3c549 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -54,7 +54,7 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas } const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { - crawlerEvents.emit('crawl-dataset-progress', {sourceUrl: crawlSource.url, crawlDataset, crawledVersion: crawlSourceVersion}) + await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? 
AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` INSERT @@ -63,6 +63,10 @@ const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlD `, [crawlDataset, crawlDatasetVersion, crawlSource.id, crawlSourceVersion, Date.now()]) } +exports.emitProgressEvent = function (sourceUrl, crawlDataset, progress, numUpdates) { + crawlerEvents.emit('crawl-dataset-progress', {sourceUrl, crawlDataset, progress, numUpdates}) +} + exports.getMatchingChangesInOrder = function (changes, regex) { var list = [] // order matters, must be oldest to newest changes.forEach(c => { From 2b562f6c0092b00654cab1e2d02ea8efae3edba5 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 23 Dec 2018 17:29:08 -0600 Subject: [PATCH 042/245] Add beaker.templates internal web api --- crawler/util.js | 1 - dbs/schemas/profile-data.sql.js | 25 ++++++++++++------------ web-apis/bg.js | 3 +++ web-apis/bg/archives.js | 20 ------------------- web-apis/bg/templates.js | 22 +++++++++++++++++++++ web-apis/fg/beaker.js | 13 ++++++++---- web-apis/manifests/internal/archives.js | 6 ------ web-apis/manifests/internal/templates.js | 6 ++++++ 8 files changed, 52 insertions(+), 44 deletions(-) create mode 100644 web-apis/bg/templates.js create mode 100644 web-apis/manifests/internal/templates.js diff --git a/crawler/util.js b/crawler/util.js index cbd3c549..04a9f7b2 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -54,7 +54,6 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas } const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { - await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` INSERT diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index a3305441..3879146e 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -100,6 +100,18 @@ CREATE TABLE watchlist ( FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE ); +-- list of the users current templates +CREATE TABLE templates ( + profileId INTEGER, + url TEXT NOT NULL, + title TEXT, + screenshot, + createdAt INTEGER DEFAULT (strftime('%s', 'now')), + + PRIMARY KEY (profileId, url), + FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE +); + -- list of sites being crawled CREATE TABLE crawl_sources ( id INTEGER PRIMARY KEY NOT NULL, @@ -157,19 +169,6 @@ CREATE TABLE crawl_followgraph ( FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); --- list of the users current templates --- deprecated (may return) -CREATE TABLE templates ( - profileId INTEGER, - url TEXT NOT NULL, - title TEXT, - screenshot, - createdAt INTEGER DEFAULT (strftime('%s', 'now')), - - PRIMARY KEY (profileId, url), - FOREIGN KEY (profileId) REFERENCES profiles (id) ON DELETE CASCADE -); - -- a list of the draft-dats for a master-dat -- deprecated CREATE TABLE archive_drafts ( diff --git a/web-apis/bg.js b/web-apis/bg.js index ac74937f..df7bfd95 100644 --- a/web-apis/bg.js +++ b/web-apis/bg.js @@ -10,6 +10,7 @@ const downloadsManifest = require('./manifests/internal/downloads') const historyManifest = require('./manifests/internal/history') const sitedataManifest = require('./manifests/internal/sitedata') const watchlistManifest = require('./manifests/internal/watchlist') +const templatesManifest = require('./manifests/internal/templates') const crawlerManifest = 
require('./manifests/internal/crawler') const postsManifest = require('./manifests/internal/posts') const followgraphManifest = require('./manifests/internal/followgraph') @@ -20,6 +21,7 @@ const bookmarksAPI = require('./bg/bookmarks') const historyAPI = require('./bg/history') const sitedataAPI = require('../dbs/sitedata').WEBAPI const watchlistAPI = require('./bg/watchlist') +const templatesAPI = require('./bg/templates') const crawlerAPI = require('../crawler').WEBAPI const postsAPI = require('./bg/posts') const followgraphAPI = require('./bg/followgraph') @@ -56,6 +58,7 @@ exports.setup = function () { globals.rpcAPI.exportAPI('history', historyManifest, historyAPI, internalOnly) globals.rpcAPI.exportAPI('sitedata', sitedataManifest, sitedataAPI, internalOnly) globals.rpcAPI.exportAPI('watchlist', watchlistManifest, watchlistAPI, internalOnly) + globals.rpcAPI.exportAPI('templates', templatesManifest, templatesAPI, internalOnly) globals.rpcAPI.exportAPI('crawler', crawlerManifest, crawlerAPI, internalOnly) globals.rpcAPI.exportAPI('posts', postsManifest, postsAPI, internalOnly) globals.rpcAPI.exportAPI('followgraph', followgraphManifest, followgraphAPI, internalOnly) diff --git a/web-apis/bg/archives.js b/web-apis/bg/archives.js index 60385262..6432e88c 100644 --- a/web-apis/bg/archives.js +++ b/web-apis/bg/archives.js @@ -1,7 +1,6 @@ const path = require('path') const mkdirp = require('mkdirp') const jetpack = require('fs-jetpack') -const templatesDb = require('../../dbs/templates') const datDns = require('../../dat/dns') const datLibrary = require('../../dat/library') const datGC = require('../../dat/garbage-collector') @@ -266,25 +265,6 @@ module.exports = { return archiveDraftsDb.remove(0, masterKey, draftKey) }, - // templates - // = - - async getTemplate (url) { - return templatesDb.get(0, url) - }, - - async listTemplates () { - return templatesDb.list(0) - }, - - async putTemplate (url, {title, screenshot}) { - return templatesDb.put(0, url, {title, screenshot}) - }, - - async removeTemplate (url) { - return templatesDb.remove(0, url) - }, - // internal management // = diff --git a/web-apis/bg/templates.js b/web-apis/bg/templates.js new file mode 100644 index 00000000..3d6c3eca --- /dev/null +++ b/web-apis/bg/templates.js @@ -0,0 +1,22 @@ +const templatesDb = require('../../dbs/templates') + +// exported api +// = + +module.exports = { + async get (url) { + return templatesDb.get(0, url) + }, + + async list () { + return templatesDb.list(0) + }, + + async put (url, {title, screenshot}) { + return templatesDb.put(0, url, {title, screenshot}) + }, + + async remove (url) { + return templatesDb.remove(0, url) + } +} \ No newline at end of file diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 81c420ad..532b72cf 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -8,6 +8,7 @@ const downloadsManifest = require('../manifests/internal/downloads') const historyManifest = require('../manifests/internal/history') const sitedataManifest = require('../manifests/internal/sitedata') const watchlistManifest = require('../manifests/internal/watchlist') +const templatesManifest = require('../manifests/internal/templates') const crawlerManifest = require('../manifests/internal/crawler') const postsManifest = require('../manifests/internal/posts') const followgraphManifest = require('../manifests/internal/followgraph') @@ -25,6 +26,7 @@ exports.setup = function (rpc) { const historyRPC = rpc.importAPI('history', historyManifest, opts) const sitedataRPC = 
rpc.importAPI('sitedata', sitedataManifest, opts) const watchlistRPC = rpc.importAPI('watchlist', watchlistManifest, opts) + const templatesRPC = rpc.importAPI('templates', templatesManifest, opts) const crawlerRPC = rpc.importAPI('crawler', crawlerManifest, opts) const postsRPC = rpc.importAPI('posts', postsManifest, opts) const followgraphRPC = rpc.importAPI('followgraph', followgraphManifest, opts) @@ -49,10 +51,6 @@ exports.setup = function (rpc) { beaker.archives.listDrafts = archivesRPC.listDrafts beaker.archives.addDraft = archivesRPC.addDraft beaker.archives.removeDraft = archivesRPC.removeDraft - beaker.archives.getTemplate = archivesRPC.getTemplate - beaker.archives.listTemplates = archivesRPC.listTemplates - beaker.archives.putTemplate = archivesRPC.putTemplate - beaker.archives.removeTemplate = archivesRPC.removeTemplate beaker.archives.touch = archivesRPC.touch beaker.archives.clearFileCache = archivesRPC.clearFileCache beaker.archives.clearGarbage = archivesRPC.clearGarbage @@ -160,6 +158,13 @@ exports.setup = function (rpc) { beaker.watchlist.remove = watchlistRPC.remove beaker.watchlist.createEventsStream = () => fromEventStream(watchlistRPC.createEventsStream()) + // beaker.templates + beaker.templates = {} + beaker.templates.get = templatesRPC.get + beaker.templates.list = templatesRPC.list + beaker.templates.put = templatesRPC.put + beaker.templates.remove = templatesRPC.remove + // beaker.crawler beaker.crawler = {} beaker.crawler.getCrawlStates = crawlerRPC.getCrawlStates diff --git a/web-apis/manifests/internal/archives.js b/web-apis/manifests/internal/archives.js index 3eb9a6f9..d6eecebc 100644 --- a/web-apis/manifests/internal/archives.js +++ b/web-apis/manifests/internal/archives.js @@ -27,12 +27,6 @@ module.exports = { addDraft: 'promise', removeDraft: 'promise', - // templates - getTemplate: 'promise', - listTemplates: 'promise', - putTemplate: 'promise', - removeTemplate: 'promise', - // internal management touch: 'promise', clearFileCache: 'promise', diff --git a/web-apis/manifests/internal/templates.js b/web-apis/manifests/internal/templates.js new file mode 100644 index 00000000..78500b87 --- /dev/null +++ b/web-apis/manifests/internal/templates.js @@ -0,0 +1,6 @@ +module.exports = { + get: 'promise', + list: 'promise', + put: 'promise', + remove: 'promise' +} \ No newline at end of file From 76b31898acb62642ef0e6a78362081b254cc3b26 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 23 Dec 2018 18:09:18 -0600 Subject: [PATCH 043/245] Fix limit/offset part of queries --- crawler/posts.js | 12 ++++++------ crawler/site-descriptions.js | 12 ++++++------ 2 files changed, 12 insertions(+), 12 deletions(-) diff --git a/crawler/posts.js b/crawler/posts.js index 32db063a..298d2b84 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -127,17 +127,17 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { values.push(a) } } - if (offset) { - query += ` OFFSET ?` - values.push(offset) + query += ` ORDER BY createdAt` + if (reverse) { + query += ` DESC` } if (limit) { query += ` LIMIT ?` values.push(limit) } - query += ` ORDER BY createdAt` - if (reverse) { - query += ` DESC` + if (offset) { + query += ` OFFSET ?` + values.push(offset) } // execute query diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js index d92ac1e4..7e9c18e2 100644 --- a/crawler/site-descriptions.js +++ b/crawler/site-descriptions.js @@ -159,17 +159,17 @@ const list = exports.list = async function ({offset, limit, reverse, author, sub } query += `) ` } - 
if (offset) { - query += ` OFFSET ?` - values.push(offset) + query += ` ORDER BY createdAt` + if (reverse) { + query += ` DESC` } if (limit) { query += ` LIMIT ?` values.push(limit) } - query += ` ORDER BY createdAt` - if (reverse) { - query += ` DESC` + if (offset) { + query += ` OFFSET ?` + values.push(offset) } // execute query From 1cd71bfe953d4ace8e672abf822555dcf1e498b4 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 23 Dec 2018 18:17:03 -0600 Subject: [PATCH 044/245] Fix {authors} handling of posts.list --- crawler/posts.js | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/crawler/posts.js b/crawler/posts.js index 298d2b84..517c65eb 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -100,17 +100,21 @@ exports.crawlSite = async function (archive, crawlSource) { }) } -exports.list = async function ({offset, limit, reverse, author} = {}) { +exports.list = async function ({offset, limit, reverse, author, authors} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') assert(!limit || typeof limit === 'number', 'Limit must be a number') assert(!reverse || typeof reverse === 'boolean', 'Reverse must be a boolean') - assert(!author || typeof author === 'string' || (Array.isArray(author) && author.every(isString)), 'Author must be a string or an array of strings') + assert(!author || typeof author === 'string', 'Author must be a string') + assert(!authors || (Array.isArray(authors) && authors.every(isString)), 'Authors must be an array of strings') if (author) { - author = Array.isArray(author) ? author : [author] - try { author = author.map(toOrigin) } - catch (e) { throw new Error('Author must contain valid URLs') } + authors = authors || [] + authors.push(author) + } + if (authors) { + try { authors = authors.map(toOrigin) } + catch (e) { throw new Error('Author/authors must contain valid URLs') } } // build query @@ -119,9 +123,9 @@ exports.list = async function ({offset, limit, reverse, author} = {}) { INNER JOIN crawl_sources src ON src.id = crawl_posts.crawlSourceId ` var values = [] - if (author) { + if (authors) { let op = 'WHERE' - for (let a of author) { + for (let a of authors) { query += ` ${op} src.url = ?` op = 'OR' values.push(a) From d25d940025d581af99774237051fd6ed6ba5aa1b Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 23 Dec 2018 19:15:47 -0600 Subject: [PATCH 045/245] Add ?disable_fallback_page QP to dat:// --- dat/protocol.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/dat/protocol.js b/dat/protocol.js index e018d7eb..39fe8847 100644 --- a/dat/protocol.js +++ b/dat/protocol.js @@ -262,7 +262,7 @@ exports.electronHandler = async function (request, respond) { debug('Entry not found:', urlp.path) // check for a fallback page - if (manifest && manifest.fallback_page) { + if (manifest && manifest.fallback_page && !urlp.query.disable_fallback_page) { await tryStat(manifest.fallback_page) } From 80d945fb66c9c23a19a2ab214c9baaa9988ee984 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Wed, 26 Dec 2018 22:41:53 -0600 Subject: [PATCH 046/245] dat:// - look for file extensions based on Accept header --- dat/protocol.js | 5 ++++- lib/mime.js | 10 ++++++++++ 2 files changed, 14 insertions(+), 1 deletion(-) diff --git a/dat/protocol.js b/dat/protocol.js index 39fe8847..6d4c55a3 100644 --- a/dat/protocol.js +++ b/dat/protocol.js @@ -213,7 +213,10 @@ exports.electronHandler = async function (request, respond) { await tryStat(filepath) } else { await 
tryStat(filepath) - await tryStat(filepath + '.html') // fallback to .html + for (let ext of mime.acceptHeaderExtensions(request.headers.Accept)) { + // fallback to different requested headers + await tryStat(filepath + ext) + } if (entry && entry.isDirectory()) { // unexpected directory, give the .html fallback a chance let dirEntry = entry diff --git a/lib/mime.js b/lib/mime.js index 57bb74b3..6b0b6d79 100644 --- a/lib/mime.js +++ b/lib/mime.js @@ -63,6 +63,16 @@ exports.isFileContentBinary = async function (fsInstance, filepath) { }) } +// for a given HTTP accept header, provide a list of file-extensions to try +exports.acceptHeaderExtensions = function (accept) { + var exts = [] + accept = accept.split(',') + if (accept.includes('text/html') || (accept.length === 1 && accept[0] === '*/*')) exts.push('.html') + if (accept.includes('text/css')) exts.push('.css') + if (accept.includes('image/*') || accept.includes('image/apng')) exts = exts.concat(['.png', '.jpg', '.jpeg', '.gif']) + return exts +} + // pulled from https://github.com/gjtorikian/isBinaryFile function isBinaryCheck (bytes) { var size = bytes.length From 4e45caa73d9fe913c8f99a88aa6240f4e535dc34 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Tue, 1 Jan 2019 12:00:41 -0600 Subject: [PATCH 047/245] Fix exception when no Accept header is set --- lib/mime.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/mime.js b/lib/mime.js index 6b0b6d79..7d21e2a9 100644 --- a/lib/mime.js +++ b/lib/mime.js @@ -66,7 +66,7 @@ exports.isFileContentBinary = async function (fsInstance, filepath) { // for a given HTTP accept header, provide a list of file-extensions to try exports.acceptHeaderExtensions = function (accept) { var exts = [] - accept = accept.split(',') + accept = (accept || '').split(',') if (accept.includes('text/html') || (accept.length === 1 && accept[0] === '*/*')) exts.push('.html') if (accept.includes('text/css')) exts.push('.css') if (accept.includes('image/*') || accept.includes('image/apng')) exts = exts.concat(['.png', '.jpg', '.jpeg', '.gif']) From 2bca05f7d7f7bd492fe72ced7a0d90649f7460cb Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Tue, 1 Jan 2019 13:11:54 -0600 Subject: [PATCH 048/245] Fix dat download-as-zip --- dat/protocol.js | 4 ++-- lib/zip.js | 42 ++++++++++++++++++++++++++++++++++++++++++ package-lock.json | 19 ------------------- package.json | 4 ++-- 4 files changed, 46 insertions(+), 23 deletions(-) create mode 100644 lib/zip.js diff --git a/dat/protocol.js b/dat/protocol.js index 6d4c55a3..d146a752 100644 --- a/dat/protocol.js +++ b/dat/protocol.js @@ -4,7 +4,7 @@ const parseRange = require('range-parser') const once = require('once') const debug = require('../lib/debug-logger').debugLogger('dat-serve') const intoStream = require('into-stream') -const toZipStream = require('hyperdrive-to-zip-stream') +const {toZipStream} = require('../lib/zip') const slugify = require('slugify') const datDns = require('./dns') @@ -173,7 +173,7 @@ exports.electronHandler = async function (request, respond) { }) } else { // serve the zip - var zs = toZipStream(archive, filepath) + var zs = toZipStream(checkoutFS, filepath) zs.on('error', err => console.log('Error while producing .zip file', err)) return respond({ statusCode: 200, diff --git a/lib/zip.js b/lib/zip.js new file mode 100644 index 00000000..ee7cb310 --- /dev/null +++ b/lib/zip.js @@ -0,0 +1,42 @@ +const {join} = require('path') +const yazl = require('yazl') + +exports.toZipStream = function (archive, dirpath) { + var zipfile = new 
yazl.ZipFile() + + // create listing stream + dirpath = dirpath || '/' + archive.pda.readdir(dirpath, {recursive: true}).then(async (paths) => { + for (let path of paths) { + let readPath = join(dirpath, path) + + // files only + try { + let entry = await archive.pda.stat(readPath) + if (!entry.isFile()) { + continue + } + } catch (e) { + // ignore, file must have been removed + continue + } + + // pipe each entry into the zip + console.log('go go go', readPath, path) + zipfile.addBuffer(await archive.pda.readFile(readPath, 'binary'), path) + // NOTE + // for some reason using archive.createReadStream() to feed into the zipfile addReadStream() was not working with multiple files + // no idea why, maybe a sign of a bug in the dat-daemon's zip rpc + // -prf + } + zipfile.end() + }).catch(onerror) + + // on error, push to the output stream + function onerror (e) { + console.error('Error while producing zip stream', e) + zipfile.outputStream.emit('error', e) + } + + return zipfile.outputStream +} \ No newline at end of file diff --git a/package-lock.json b/package-lock.json index 2133c6cc..c8f5688b 100644 --- a/package-lock.json +++ b/package-lock.json @@ -1831,17 +1831,6 @@ } } }, - "hyperdrive-to-zip-stream": { - "version": "2.1.1", - "resolved": "https://registry.npmjs.org/hyperdrive-to-zip-stream/-/hyperdrive-to-zip-stream-2.1.1.tgz", - "integrity": "sha512-qHZKedMzgbLLGtY33SRm8J3n2mPCJ3v/Uhyr78W20h9MN99cwhaoKMiH9WpXy9eFCtj/EWFJRoHXqBNOvzNSXw==", - "requires": { - "from2": "^2.3.0", - "pauls-dat-api": "^8.0.1", - "through2-concurrent": "^1.1.1", - "yazl": "^2.4.2" - } - }, "iconv-lite": { "version": "0.4.24", "resolved": "https://registry.npmjs.org/iconv-lite/-/iconv-lite-0.4.24.tgz", @@ -3975,14 +3964,6 @@ "xtend": "~4.0.1" } }, - "through2-concurrent": { - "version": "1.1.1", - "resolved": "https://registry.npmjs.org/through2-concurrent/-/through2-concurrent-1.1.1.tgz", - "integrity": "sha1-EctOpMnjG8puTB5tukjRxyjDUks=", - "requires": { - "through2": "^2.0.0" - } - }, "thunky": { "version": "0.1.0", "resolved": "http://registry.npmjs.org/thunky/-/thunky-0.1.0.tgz", diff --git a/package.json b/package.json index 502fd75f..7f72977f 100644 --- a/package.json +++ b/package.json @@ -47,7 +47,6 @@ "hypercore-protocol": "^6.9.0", "hyperdrive": "^9.14.0", "hyperdrive-network-speed": "^2.1.0", - "hyperdrive-to-zip-stream": "^2.1.1", "identify-filetype": "^1.0.0", "into-stream": "^3.1.0", "lodash.debounce": "^4.0.8", @@ -81,7 +80,8 @@ "supports-sparse-files": "^1.0.2", "textextensions": "^2.4.0", "through2": "^2.0.5", - "utp-native": "^2.1.3" + "utp-native": "^2.1.3", + "yazl": "^2.5.1" }, "devDependencies": { "eslint": "^4.19.1", From a8453d089d81f7d44174404ce08bd5d8386f3dcf Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 3 Jan 2019 17:16:38 -0600 Subject: [PATCH 049/245] Add beaker.crawler.listSuggestions --- crawler/index.js | 1 + crawler/search.js | 49 ++++++++++++++++++++++++++ web-apis/fg/beaker.js | 1 + web-apis/manifests/internal/crawler.js | 1 + 4 files changed, 52 insertions(+) create mode 100644 crawler/search.js diff --git a/crawler/index.js b/crawler/index.js index 8e997cb2..799af9a0 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -126,6 +126,7 @@ exports.resetSite = async function (url) { } exports.WEBAPI = { + listSuggestions: require('./search').listSuggestions, createEventsStream, getCrawlStates, crawlSite: async (url) => { diff --git a/crawler/search.js b/crawler/search.js new file mode 100644 index 00000000..a3bd85f4 --- /dev/null +++ b/crawler/search.js @@ -0,0 
+1,49 @@ +const bookmarksDb = require('../dbs/bookmarks') +const historyDb = require('../dbs/history') +const datLibrary = require('../dat/library') + +const BUILTIN_PAGES = [ + {title: 'Feed', url: 'beaker://feed'}, + {title: 'Library', url: 'beaker://library'}, + {title: 'Search', url: 'beaker://search'}, + {title: 'Bookmarks', url: 'beaker://bookmarks'}, + {title: 'History', url: 'beaker://history'}, + {title: 'Watchlist', url: 'beaker://watchlist'}, + {title: 'Downloads', url: 'beaker://downloads'}, + {title: 'Settings', url: 'beaker://settings'}, +] + +// exported api +// = + +exports.listSuggestions = async function (query = '', opts = {}) { + var suggestions = {} + const filterFn = a => ((a.url || a.href).includes(query) || a.title.toLowerCase().includes(query)) + + // builtin pages + suggestions.apps = BUILTIN_PAGES.filter(filterFn) + + // bookmarks + var bookmarkResults = await bookmarksDb.listBookmarks(0) + if (opts.filterPins) { + bookmarkResults = bookmarkResults.filter(b => !b.pinned && filterFn(b)) + } else { + bookmarkResults = bookmarkResults.filter(filterFn) + } + bookmarkResults = bookmarkResults.slice(0, 12) + suggestions.bookmarks = bookmarkResults.map(b => ({title: b.title, url: b.href})) + + // library + var libraryResults = await datLibrary.queryArchives({isSaved: true}) + libraryResults = libraryResults.filter(filterFn) + suggestions.library = libraryResults.slice(0, 12) + + // fetch history + if (query) { + var historyResults = await historyDb.search(query) + suggestions.history = historyResults.slice(0, 12) + suggestions.history.sort((a, b) => a.url.length - b.url.length) // shorter urls at top + } + + return suggestions +} diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 532b72cf..80a5f7ea 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -167,6 +167,7 @@ exports.setup = function (rpc) { // beaker.crawler beaker.crawler = {} + beaker.crawler.listSuggestions = crawlerRPC.listSuggestions beaker.crawler.getCrawlStates = crawlerRPC.getCrawlStates beaker.crawler.crawlSite = crawlerRPC.crawlSite beaker.crawler.resetSite = crawlerRPC.resetSite diff --git a/web-apis/manifests/internal/crawler.js b/web-apis/manifests/internal/crawler.js index 47365431..2cd65b21 100644 --- a/web-apis/manifests/internal/crawler.js +++ b/web-apis/manifests/internal/crawler.js @@ -1,4 +1,5 @@ module.exports = { + listSuggestions: 'promise', getCrawlStates: 'promise', crawlSite: 'promise', resetSite: 'promise', From 07d703f8d64b1d837c3f58de2af7ff14d451cc95 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 4 Jan 2019 12:21:33 -0600 Subject: [PATCH 050/245] Rename feed -> timeline --- crawler/search.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawler/search.js b/crawler/search.js index a3bd85f4..a8b86136 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -3,7 +3,7 @@ const historyDb = require('../dbs/history') const datLibrary = require('../dat/library') const BUILTIN_PAGES = [ - {title: 'Feed', url: 'beaker://feed'}, + {title: 'Timeline', url: 'beaker://timeline'}, {title: 'Library', url: 'beaker://library'}, {title: 'Search', url: 'beaker://search'}, {title: 'Bookmarks', url: 'beaker://bookmarks'}, From d42556b24e7560867a09b4601c25aa5b6f4c2114 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 4 Jan 2019 13:51:55 -0600 Subject: [PATCH 051/245] Split search results into types --- crawler/search.js | 26 ++++++++++++++------------ lib/dat.js | 9 +++++++++ package-lock.json | 5 +++++ package.json | 1 + 4 files changed, 29 
insertions(+), 12 deletions(-) create mode 100644 lib/dat.js diff --git a/crawler/search.js b/crawler/search.js index a8b86136..9b6aa307 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -1,6 +1,8 @@ +const _groupBy = require('lodash.groupby') const bookmarksDb = require('../dbs/bookmarks') const historyDb = require('../dbs/history') const datLibrary = require('../dat/library') +const {getBasicType} = require('../lib/dat') const BUILTIN_PAGES = [ {title: 'Timeline', url: 'beaker://timeline'}, @@ -23,23 +25,23 @@ exports.listSuggestions = async function (query = '', opts = {}) { // builtin pages suggestions.apps = BUILTIN_PAGES.filter(filterFn) - // bookmarks - var bookmarkResults = await bookmarksDb.listBookmarks(0) - if (opts.filterPins) { - bookmarkResults = bookmarkResults.filter(b => !b.pinned && filterFn(b)) - } else { - bookmarkResults = bookmarkResults.filter(filterFn) - } - bookmarkResults = bookmarkResults.slice(0, 12) - suggestions.bookmarks = bookmarkResults.map(b => ({title: b.title, url: b.href})) - // library var libraryResults = await datLibrary.queryArchives({isSaved: true}) libraryResults = libraryResults.filter(filterFn) - suggestions.library = libraryResults.slice(0, 12) + Object.assign(suggestions, _groupBy(libraryResults, a => getBasicType(a.type))) - // fetch history if (query) { + // bookmarks + var bookmarkResults = await bookmarksDb.listBookmarks(0) + if (opts.filterPins) { + bookmarkResults = bookmarkResults.filter(b => !b.pinned && filterFn(b)) + } else { + bookmarkResults = bookmarkResults.filter(filterFn) + } + bookmarkResults = bookmarkResults.slice(0, 12) + suggestions.bookmarks = bookmarkResults.map(b => ({title: b.title, url: b.href})) + + // history var historyResults = await historyDb.search(query) suggestions.history = historyResults.slice(0, 12) suggestions.history.sort((a, b) => a.url.length - b.url.length) // shorter urls at top diff --git a/lib/dat.js b/lib/dat.js new file mode 100644 index 00000000..0aaef3cc --- /dev/null +++ b/lib/dat.js @@ -0,0 +1,9 @@ +exports.getBasicType = function (type) { + if (type && Array.isArray(type)) { + if (type.includes('user')) return 'user' + if (type.includes('web-page')) return 'web-page' + if (type.includes('file-share')) return 'file-share' + if (type.includes('image-collection')) return 'image-collection' + } + return 'other' +} diff --git a/package-lock.json b/package-lock.json index c8f5688b..f6b7944f 100644 --- a/package-lock.json +++ b/package-lock.json @@ -2325,6 +2325,11 @@ "resolved": "https://registry.npmjs.org/lodash.get/-/lodash.get-4.4.2.tgz", "integrity": "sha1-LRd/ZS+jHpObRDjVNBSZ36OCXpk=" }, + "lodash.groupby": { + "version": "4.6.0", + "resolved": "https://registry.npmjs.org/lodash.groupby/-/lodash.groupby-4.6.0.tgz", + "integrity": "sha1-Cwih3PaDl8OXhVwyOXg4Mt90A9E=" + }, "lodash.isequal": { "version": "4.5.0", "resolved": "https://registry.npmjs.org/lodash.isequal/-/lodash.isequal-4.5.0.tgz", diff --git a/package.json b/package.json index 7f72977f..18ef8ddd 100644 --- a/package.json +++ b/package.json @@ -52,6 +52,7 @@ "lodash.debounce": "^4.0.8", "lodash.difference": "^4.5.0", "lodash.get": "^4.4.2", + "lodash.groupby": "^4.6.0", "lodash.isequal": "^4.5.0", "lodash.pick": "^4.4.0", "lodash.throttle": "^4.1.1", From 5763d0c3ae19c774fb76acf809d1b70be46b197a Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Thu, 10 Jan 2019 16:27:14 -0600 Subject: [PATCH 052/245] Add beaker.crawler.listSearchResults and FTS indexes --- crawler/index.js | 1 + crawler/search.js | 235 
++++++++++++++++++++++++- dbs/profile-data-db.js | 3 +- dbs/schemas/profile-data.sql.js | 28 ++- dbs/schemas/profile-data.v25.sql.js | 32 ++++ package-lock.json | 5 + package.json | 1 + web-apis/fg/beaker.js | 1 + web-apis/manifests/internal/crawler.js | 1 + 9 files changed, 303 insertions(+), 4 deletions(-) create mode 100644 dbs/schemas/profile-data.v25.sql.js diff --git a/crawler/index.js b/crawler/index.js index 799af9a0..ef27b57f 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -127,6 +127,7 @@ exports.resetSite = async function (url) { exports.WEBAPI = { listSuggestions: require('./search').listSuggestions, + listSearchResults: require('./search').listSearchResults, createEventsStream, getCrawlStates, crawlSite: async (url) => { diff --git a/crawler/search.js b/crawler/search.js index 9b6aa307..6c92b7db 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -1,12 +1,17 @@ const _groupBy = require('lodash.groupby') +const _uniqWith = require('lodash.uniqwith') +const db = require('../dbs/profile-data-db') const bookmarksDb = require('../dbs/bookmarks') const historyDb = require('../dbs/history') const datLibrary = require('../dat/library') +const followgraph = require('./followgraph') +const siteDescriptions = require('./site-descriptions') const {getBasicType} = require('../lib/dat') +/** @type {Array} */ const BUILTIN_PAGES = [ {title: 'Timeline', url: 'beaker://timeline'}, - {title: 'Library', url: 'beaker://library'}, + {title: 'Your Library', url: 'beaker://library'}, {title: 'Search', url: 'beaker://search'}, {title: 'Bookmarks', url: 'beaker://bookmarks'}, {title: 'History', url: 'beaker://history'}, @@ -15,9 +20,33 @@ const BUILTIN_PAGES = [ {title: 'Settings', url: 'beaker://settings'}, ] +// typedefs +// = + // exported api // = +/** + * @description + * Get suggested content of various types. + * + * @param {string} [query=''] - The search query. + * @param {Object} [opts={}] + * @param {boolean} [opts.filterPins] - If true, will filter out pinned bookmarks. + * @returns {Promise} + * + * @typedef {Object} SuggestionResults + * @prop {Array} apps + * @prop {Array} people + * @prop {Array} webPages + * @prop {Array} fileShares + * @prop {Array} imageCollections + * @prop {Array} others + * @prop {(undefined|Array)} bookmarks + * @prop {(undefined|Array)} history + * + * TODO: make the return values much more concrete + */ exports.listSuggestions = async function (query = '', opts = {}) { var suggestions = {} const filterFn = a => ((a.url || a.href).includes(query) || a.title.toLowerCase().includes(query)) @@ -28,7 +57,12 @@ exports.listSuggestions = async function (query = '', opts = {}) { // library var libraryResults = await datLibrary.queryArchives({isSaved: true}) libraryResults = libraryResults.filter(filterFn) - Object.assign(suggestions, _groupBy(libraryResults, a => getBasicType(a.type))) + libraryResults = _groupBy(libraryResults, a => getBasicType(a.type)) + suggestions.people = libraryResults.user + suggestions.webPages = libraryResults['web-page'] + suggestions.fileShares = libraryResults['file-share'] + suggestions.imageCollections = libraryResults['image-collection'] + suggestions.others = libraryResults.other if (query) { // bookmarks @@ -49,3 +83,200 @@ exports.listSuggestions = async function (query = '', opts = {}) { return suggestions } + +/** + * @description + * Run a search query against crawled data. + * + * @param {Object} opts + * @param {string} opts.user - The current user's URL. + * @param {string} [opts.query] - The search query. 
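Together with the beaker.js and manifest wiring later in this patch, these options translate into a call from a builtin page roughly like the sketch below; userUrl is a placeholder for the current user's dat URL and is not defined by the patch.

// minimal usage sketch (from an async context) of the new search API
const results = await beaker.crawler.listSearchResults({
  user: userUrl,                         // placeholder: the local user's dat:// URL
  query: 'p2p web',
  hops: 1,
  types: {people: true, posts: true},
  limit: 20
})
// matched terms come back wrapped in {nonce}...{/nonce} perimeters (see highlightNonce)
console.log(results.people, results.posts)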
+ * @param {number} [opts.hops=1] - How many hops out in the user's follow graph should be included? + * @param {Object} [opts.types] - Content types to query. Defaults to all. + * @param {boolean} [opts.types.people] + * @param {boolean} [opts.types.posts] + * @param {number} [opts.since] - Filter results to items created since the given timestamp. + * @param {number} [opts.offset] + * @param {number} [opts.limit = 20] + * @returns {Promise} + * + * Search results: + * @typedef {Object} SearchResults + * @prop {number} highlightNonce - A number used to create perimeters around text that should be highlighted. + * @prop {(null|Array)} people + * @prop {(null|Array)} posts + * + * People search results: + * @typedef {Object} PeopleSearchResult + * @prop {string} url + * @prop {string} title + * @prop {string} description + * @prop {Array} followedBy + * @prop {bool} followsUser + * @prop {Object} author + * @prop {string} author.url + * + * Post search results: + * @typedef {Object} PostSearchResult + * @prop {string} url + * @prop {SiteDescription} author + * @prop {string} content + * @prop {string} createdAt + * @prop {string} [updatedAt] + * + * Site description objects: + * @typedef {Object} SiteDescription + * @prop {string} url + * @prop {string} [title] + * @prop {string} [description] + * @prop {Array} [type] + * @prop {Object} [author] + * @prop {string} [author.url] + */ +exports.listSearchResults = async function (opts) { + const highlightNonce = (Math.random() * 1e3)|0 + const startHighlight = `{${highlightNonce}}` + const endHighlight = `{/${highlightNonce}}` + + var searchResults = { + highlightNonce, + people: null, + posts: null + } + var {user, query, hops, types, since, offset, limit} = opts + if (!types || typeof types !== 'object') { + types = {people: true, posts: true} + } + since = since || 0 + offset = offset || 0 + limit = limit || 20 + hops = Math.min(Math.max(Math.floor(hops), 1), 2) // clamp to [1, 2] for now + + // prep search terms + if (query && typeof query === 'string') { + query = query + .toLowerCase() // all lowercase. (uppercase is interpretted as a directive by sqlite.) + .replace(/[:^*\.]/g, ' ') // strip symbols that sqlite interprets. + query += '*' // match prefixes + } + + // get user's crawl_source id + var userCrawlSourceId + { + let res = await db.get(`SELECT id FROM crawl_sources WHERE url = ?`, [user]) + userCrawlSourceId = res.id + } + + // construct set of crawl sources to query + var crawlSourceIds + if (hops === 2) { + // the user and all followed sources + let res = await db.all(` + SELECT id FROM crawl_sources src + INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = src.url AND fgraph.crawlSourceId = ? 
+ `, [userCrawlSourceId]) + crawlSourceIds = [userCrawlSourceId].concat(res.map(({id}) => id)) + } else if (hops === 1) { + // just the user + crawlSourceIds = [userCrawlSourceId] + } + + // run queries + if (types.people) { + if (query) { + searchResults.people = await db.all(` + SELECT + desc.subject AS url, + descSrc.url AS authorUrl, + SNIPPET(crawl_site_descriptions_fts_index, 0, '${startHighlight}', '${endHighlight}', '...', 25) AS title, + SNIPPET(crawl_site_descriptions_fts_index, 1, '${startHighlight}', '${endHighlight}', '...', 25) AS description + FROM crawl_site_descriptions_fts_index desc_fts + INNER JOIN crawl_site_descriptions desc ON desc.rowid = desc_fts.rowid + INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.subject AND fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) + INNER JOIN crawl_sources descSrc ON desc.crawlSourceId = descSrc.id + WHERE crawl_site_descriptions_fts_index MATCH ? + ORDER BY rank + LIMIT ? + OFFSET ?; + `, [query, limit, offset]) + } else { + searchResults.people = await db.all(` + SELECT desc.subject AS url, desc.title, desc.description, descSrc.url AS authorUrl + FROM crawl_site_descriptions desc + INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.subject AND fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) + INNER JOIN crawl_sources descSrc ON desc.crawlSourceId = descSrc.id + ORDER BY desc.createdAt + LIMIT ? + OFFSET ?; + `, [limit, offset]) + } + searchResults.people = _uniqWith(searchResults.people, (a, b) => a.url === b.url) + await Promise.all(searchResults.people.map(async (p) => { + // fetch additional info + p.followedBy = await followgraph.listFollowers(p.url, {includeDesc: true}) + p.followsUser = await followgraph.isAFollowingB(p.url, user) + + // massage attrs + p.author = {url: p.authorUrl} + delete p.authorUrl + })) + } + if (types.posts) { + if (query) { + searchResults.posts = await db.all(` + SELECT + SNIPPET(crawl_posts_fts_index, 0, '${startHighlight}', '${endHighlight}', '...', 25) AS content, + post.pathname, + post.createdAt, + post.updatedAt, + postSrc.url AS authorUrl + FROM crawl_posts_fts_index post_fts + INNER JOIN crawl_posts post ON post.rowid = post_fts.rowid + INNER JOIN crawl_sources postSrc ON post.crawlSourceId = postSrc.id + LEFT JOIN crawl_followgraph fgraph ON fgraph.destUrl = postSrc.url + WHERE + crawl_posts_fts_index MATCH ? + AND (fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) OR post.crawlSourceId = ?) + AND post.createdAt >= ? + ORDER BY rank + LIMIT ? + OFFSET ?; + `, [query, userCrawlSourceId, since, limit, offset]) + } else { + searchResults.posts = await db.all(` + SELECT post.content, post.pathname, post.createdAt, post.updatedAt, postSrc.url AS authorUrl + FROM crawl_posts post + INNER JOIN crawl_sources postSrc ON post.crawlSourceId = postSrc.id + LEFT JOIN crawl_followgraph fgraph ON fgraph.destUrl = postSrc.url + WHERE + (fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) OR post.crawlSourceId = ?) + AND post.createdAt >= ? + ORDER BY post.createdAt DESC + LIMIT ? 
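Because SNIPPET() wraps matches in the {nonce}...{/nonce} perimeters defined above, a renderer has to HTML-escape the text before swapping the perimeters for markup; a minimal sketch of that step (the helper name is illustrative, not part of the patch):

// hedged sketch: convert highlight perimeters to markup after escaping
function toHighlightedHTML (text, highlightNonce) {
  const esc = s => s.replace(/&/g, '&amp;').replace(/</g, '&lt;').replace(/>/g, '&gt;')
  return esc(text)
    .split(`{${highlightNonce}}`).join('<strong>')
    .split(`{/${highlightNonce}}`).join('</strong>')
}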
+ OFFSET ?; + `, [userCrawlSourceId, since, limit, offset]) + } + await Promise.all(searchResults.posts.map(async (p) => { + // fetch additional info + p.author = await siteDescriptions.getBest({subject: p.authorUrl}) + + // massage attrs + p.url = p.authorUrl + p.pathname + delete p.authorUrl + delete p.pathname + })) + // TODO hops == 2 + /*searchResults.posts = await db.all(` + SELECT post.content, post.pathname, postSrc.url + FROM crawl_posts post + INNER JOIN crawl_sources postSrc ON post.crawlSourceId = postSrc.id + INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = postSrc.url AND fgraph.crawlSourceId = ? + WHERE (post.content MATCH ?) AND (post.createdAt >= ?) + ORDER BY rank + LIMIT ? + OFFSET ?; + `, [userCrawlSourceId, query, since, offset, limit])*/ + } + + return searchResults +} diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index a4c919b4..542ea376 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -79,7 +79,8 @@ migrations = [ migration('profile-data.v21.sql'), migration('profile-data.v22.sql', {canFail: true}), // canFail for the same reason as v16, ffs migration('profile-data.v23.sql'), - migration('profile-data.v24.sql') + migration('profile-data.v24.sql'), + migration('profile-data.v25.sql') ] function migration (file, opts = {}) { return cb => { diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index 3879146e..f59bada2 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -144,6 +144,19 @@ CREATE TABLE crawl_site_descriptions ( PRIMARY KEY (crawlSourceId, pathname), FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +CREATE VIRTUAL TABLE crawl_site_descriptions_fts_index USING fts5(title, description, content='crawl_site_descriptions'); + +-- triggers to keep crawl_site_descriptions_fts_index updated +CREATE TRIGGER crawl_site_descriptions_ai AFTER INSERT ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; +CREATE TRIGGER crawl_site_descriptions_ad AFTER DELETE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.rowid, old.title, old.description); +END; +CREATE TRIGGER crawl_site_descriptions_au AFTER UPDATE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.a, old.title, old.description); + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; -- crawled posts CREATE TABLE crawl_posts ( @@ -157,6 +170,19 @@ CREATE TABLE crawl_posts ( FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +CREATE VIRTUAL TABLE crawl_posts_fts_index USING fts5(content, content='crawl_posts'); + +-- triggers to keep crawl_posts_fts_index updated +CREATE TRIGGER crawl_posts_ai AFTER INSERT ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; +CREATE TRIGGER crawl_posts_ad AFTER DELETE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); +END; +CREATE TRIGGER crawl_posts_au AFTER UPDATE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', 
old.rowid, old.content); + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; -- crawled follows CREATE TABLE crawl_followgraph ( @@ -232,5 +258,5 @@ INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Report an issu INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Explore the p2p Web', 'dat://taravancil.com/explore-the-p2p-web.md', 1); INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Support Beaker', 'https://opencollective.com/beaker', 1); -PRAGMA user_version = 24; +PRAGMA user_version = 25; ` diff --git a/dbs/schemas/profile-data.v25.sql.js b/dbs/schemas/profile-data.v25.sql.js new file mode 100644 index 00000000..b84e73a1 --- /dev/null +++ b/dbs/schemas/profile-data.v25.sql.js @@ -0,0 +1,32 @@ +module.exports = ` + +-- add full-text search indexes +CREATE VIRTUAL TABLE crawl_site_descriptions_fts_index USING fts5(title, description, content='crawl_site_descriptions'); +CREATE VIRTUAL TABLE crawl_posts_fts_index USING fts5(content, content='crawl_posts'); + +-- triggers to keep crawl_site_descriptions_fts_index updated +CREATE TRIGGER crawl_site_descriptions_ai AFTER INSERT ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; +CREATE TRIGGER crawl_site_descriptions_ad AFTER DELETE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.rowid, old.title, old.description); +END; +CREATE TRIGGER crawl_site_descriptions_au AFTER UPDATE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.a, old.title, old.description); + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; + +-- triggers to keep crawl_posts_fts_index updated +CREATE TRIGGER crawl_posts_ai AFTER INSERT ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; +CREATE TRIGGER crawl_posts_ad AFTER DELETE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); +END; +CREATE TRIGGER crawl_posts_au AFTER UPDATE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; + +PRAGMA user_version = 25; +` \ No newline at end of file diff --git a/package-lock.json b/package-lock.json index f6b7944f..abce505b 100644 --- a/package-lock.json +++ b/package-lock.json @@ -2345,6 +2345,11 @@ "resolved": "https://registry.npmjs.org/lodash.throttle/-/lodash.throttle-4.1.1.tgz", "integrity": "sha1-wj6RtxAkKscMN/HhzaknTMOb8vQ=" }, + "lodash.uniqwith": { + "version": "4.5.0", + "resolved": "https://registry.npmjs.org/lodash.uniqwith/-/lodash.uniqwith-4.5.0.tgz", + "integrity": "sha1-egy/ZfQ7WShiWp1NDcVLGMrcfvM=" + }, "lru": { "version": "3.1.0", "resolved": "https://registry.npmjs.org/lru/-/lru-3.1.0.tgz", diff --git a/package.json b/package.json index 18ef8ddd..f933fb4a 100644 --- a/package.json +++ b/package.json @@ -56,6 +56,7 @@ "lodash.isequal": "^4.5.0", "lodash.pick": "^4.4.0", "lodash.throttle": "^4.1.1", + "lodash.uniqwith": "^4.5.0", "mime": "^1.4.0", 
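The triggers above keep the external-content fts5 tables in sync with their base tables, so a crawled post can be found with MATCH as soon as it is inserted; a query sketch in the same style as the search.js code in this patch (illustrative only):

// hedged sketch: full-text lookup against the new crawl_posts index
var rows = await db.all(`
  SELECT post.pathname, snippet(crawl_posts_fts_index, 0, '[', ']', '...', 25) AS excerpt
    FROM crawl_posts_fts_index post_fts
    INNER JOIN crawl_posts post ON post.rowid = post_fts.rowid
    WHERE crawl_posts_fts_index MATCH ?
`, ['beaker*'])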
"mkdirp": "^0.5.1", "moment": "^2.23.0", diff --git a/web-apis/fg/beaker.js b/web-apis/fg/beaker.js index 80a5f7ea..819a0ec3 100644 --- a/web-apis/fg/beaker.js +++ b/web-apis/fg/beaker.js @@ -168,6 +168,7 @@ exports.setup = function (rpc) { // beaker.crawler beaker.crawler = {} beaker.crawler.listSuggestions = crawlerRPC.listSuggestions + beaker.crawler.listSearchResults = crawlerRPC.listSearchResults beaker.crawler.getCrawlStates = crawlerRPC.getCrawlStates beaker.crawler.crawlSite = crawlerRPC.crawlSite beaker.crawler.resetSite = crawlerRPC.resetSite diff --git a/web-apis/manifests/internal/crawler.js b/web-apis/manifests/internal/crawler.js index 2cd65b21..af7554a2 100644 --- a/web-apis/manifests/internal/crawler.js +++ b/web-apis/manifests/internal/crawler.js @@ -1,5 +1,6 @@ module.exports = { listSuggestions: 'promise', + listSearchResults: 'promise', getCrawlStates: 'promise', crawlSite: 'promise', resetSite: 'promise', From 8bab9d1bf29d716ddbe3c7cb45de552906a27bb2 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 11 Jan 2019 17:33:17 -0600 Subject: [PATCH 053/245] Update the known_sites implementation to use folder-based captures and to index self-descriptions. Also added a lot of jsdocs to the crawler. --- crawler/followgraph.js | 107 +++++++++--- crawler/index.js | 1 + crawler/posts.js | 100 +++++++++++- crawler/search.js | 119 +++++++------- crawler/site-descriptions.js | 244 ++++++++++++++++------------ crawler/util.js | 65 +++++++- dbs/profile-data-db.js | 3 +- dbs/schemas/profile-data.sql.js | 7 +- dbs/schemas/profile-data.v24.sql.js | 30 +++- dbs/schemas/profile-data.v25.sql.js | 32 ---- 10 files changed, 475 insertions(+), 233 deletions(-) delete mode 100644 dbs/schemas/profile-data.v25.sql.js diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 0340117d..7f967e2e 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -16,6 +16,19 @@ const TABLE_VERSION = 1 const JSON_TYPE = 'unwalled.garden/follows' const JSON_PATH = '/data/follows.json' +// typedefs +// = + +/** + * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} + * @typedef SiteDescription {import('./site-descriptions').SiteDescription} + * + * @typedef {Object} SiteDescriptionWithFollowData + * @extends {SiteDescription} + * @prop {boolean} [followsUser] - does this site follow the specified user site? + * @prop {Array} [followedBy] - list of sites following this site. + */ + // globals // = @@ -28,6 +41,14 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) +/** + * @description + * Crawl the given site for follows. + * + * @param {InternalDatArchive} archive - site to crawl. + * @param {CrawlSourceRecord} crawlSource - internal metadata about the crawl target. + * @returns {Promise} + */ exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info @@ -97,11 +118,16 @@ exports.crawlSite = async function (archive, crawlSource) { }) } -// List sites that follow subject -// - subject. String (URL). -// - opts.followedBy. String (URL). -// - opts.includeDesc. Boolean. -// - returns Array +/** + * @description + * List sites that follow subject. 
+ * + * @param {string} subject - (URL) + * @param {Object} [opts] + * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. + * @param {boolean} [opts.includeDesc] - output a site description instead of a simple URL. + * @returns {(Promise>|Promise>)} + */ const listFollowers = exports.listFollowers = async function (subject, {followedBy, includeDesc} = {}) { var rows if (followedBy) { @@ -138,12 +164,17 @@ const listFollowers = exports.listFollowers = async function (subject, {followed })) } -// List sites that subject follows -// - subject. String (URL). -// - opts.followedBy. String (URL). Filters to users who are followed by the URL specified. Causes .followsUser boolean to be set. -// - opts.includeDesc. Boolean. -// - opts.includeFollowers. Boolean. Requires includeDesc to be true. -// - returns Array +/** + * @description + * List sites that subject follows. + * + * @param {string} subject - (URL) + * @param {Object} [opts] + * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. + * @param {boolean} [opts.includeDesc] - output a site description instead of a simple URL. + * @param {boolean} [opts.includeFollowers] - include .followedBy in the result. Requires includeDesc to be true. + * @returns {(Promise>|Promise>)} + */ const listFollows = exports.listFollows = async function (subject, {followedBy, includeDesc, includeFollowers} = {}) { var rows = await db.all(` SELECT crawl_followgraph.destUrl @@ -169,10 +200,15 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, })) } -// List sites that are followed by sites that the subject follows -// - subject. String (URL). -// - opts.followedBy. String (URL). Filters to users who are followed by the URL specified. Causes .followsUser boolean to be set. -// - returns Array +/** + * @description + * List sites that are followed by sites that the subject follows. + * + * @param {string} subject - (URL) + * @param {Object} [opts] + * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. + * @returns {Promise>} + */ const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {}) { var foafs = [] // list URLs followed by subject @@ -196,10 +232,14 @@ const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {} return foafs } -// Check for the existence of an individual follow -// - a. String (URL), the site being queried. -// - b. String (URL), does a follow this site? -// - returns bool +/** + * @description + * Check for the existence of an individual follow. + * + * @param {string} a - (URL) the site being queried. + * @param {string} b - (URL) does a follow this site? + * @returns {Promise} + */ const isAFollowingB = exports.isAFollowingB = async function (a, b) { a = toOrigin(a) b = toOrigin(b) @@ -214,6 +254,14 @@ const isAFollowingB = exports.isAFollowingB = async function (a, b) { return !!res } +/** + * @description + * Add a follow to the given archive. 
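A minimal sketch of the write path these two methods expose, again assuming the module is required as followgraph; userArchive and the dat URL are placeholders:

// hedged sketch: follow() edits the archive's follows.json and captures the
// followed site's description in the background; unfollow() reverses the edit
await followgraph.follow(userArchive, 'dat://example.com')
console.log(await followgraph.isAFollowingB(userArchive.url, 'dat://example.com')) // true once re-crawled
await followgraph.unfollow(userArchive, 'dat://example.com')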
+ * + * @param {InternalDatArchive} archive + * @param {string} followUrl + * @returns {Promise} + */ exports.follow = async function (archive, followUrl) { // normalize followUrl followUrl = toOrigin(followUrl) @@ -230,6 +278,14 @@ exports.follow = async function (archive, followUrl) { /* dont await */siteDescriptions.capture(archive, followUrl) } +/** + * @description + * Remove a follow from the given archive. + * + * @param {InternalDatArchive} archive + * @param {string} followUrl + * @returns {Promise} + */ exports.unfollow = async function (archive, followUrl) { // normalize followUrl followUrl = toOrigin(followUrl) @@ -247,6 +303,10 @@ exports.unfollow = async function (archive, followUrl) { // internal methods // = +/** + * @param {string} url + * @returns {string} + */ function toOrigin (url) { try { url = new URL(url) @@ -256,6 +316,10 @@ function toOrigin (url) { } } +/** + * @param {InternalDatArchive} archive + * @returns {Promise} + */ async function readFollowsFile (archive) { try { var followsJson = await archive.pda.readFile(JSON_PATH, 'utf8') @@ -271,6 +335,11 @@ async function readFollowsFile (archive) { return followsJson } +/** + * @param {InternalDatArchive} archive + * @param {(Object) => undefined} updateFn + * @returns {Promise} + */ async function updateFollowsFile (archive, updateFn) { var release = await lock('crawler:followgraph:' + archive.url) try { diff --git a/crawler/index.js b/crawler/index.js index ef27b57f..bcb1c692 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -89,6 +89,7 @@ exports.crawlSite = async function (archive) { siteDescriptions.crawlSite(archive, crawlSource) ]) } catch (err) { + console.error('Crawler error', {sourceUrl: archive.url, err: err.toString()}) crawlerEvents.emit('crawl-error', {sourceUrl: archive.url, err: err.toString()}) } finally { crawlerEvents.emit('crawl-finish', {sourceUrl: archive.url}) diff --git a/crawler/posts.js b/crawler/posts.js index 517c65eb..c5e33378 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -3,6 +3,7 @@ const {URL} = require('url') const Events = require('events') const db = require('../dbs/profile-data-db') const crawler = require('./index') +const siteDescriptions = require('./site-descriptions') const {doCrawl, doCheckpoint, emitProgressEvent, getMatchingChangesInOrder, generateTimeFilename} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') @@ -13,6 +14,22 @@ const TABLE_VERSION = 1 const JSON_TYPE = 'unwalled.garden/post' const JSON_PATH_REGEX = /^\/data\/posts\/([^/]+)\.json$/i +// typedefs +// = + +/** + * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} + * @typedef SiteDescription { import("./site-descriptions").SiteDescription } + * + * @typedef {Object} Post + * @prop {string} pathname + * @prop {string} content + * @prop {number} crawledAt + * @prop {number} createdAt + * @prop {number} updatedAt + * @prop {SiteDescription} author + */ + // globals // = @@ -25,6 +42,14 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) +/** + * @description + * Crawl the given site for posts. + * + * @param {InternalDatArchive} archive - site to crawl. + * @param {CrawlSourceRecord} crawlSource - internal metadata about the crawl target. 
+ * @returns {Promise} + */ exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_posts', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info @@ -100,6 +125,18 @@ exports.crawlSite = async function (archive, crawlSource) { }) } +/** + * @description + * List crawled posts. + * + * @param {Object} [opts] + * @param {string} [opts.author] - (URL) filter descriptions to those created by this author. + * @param {Array} [opts.authors] - (URL) filter descriptions to those created by these authors. + * @param {number} [opts.offset] + * @param {number} [opts.limit] + * @param {boolean} [opts.reverse] + * @returns {Promise>} + */ exports.list = async function ({offset, limit, reverse, author, authors} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') @@ -145,9 +182,18 @@ exports.list = async function ({offset, limit, reverse, author, authors} = {}) { } // execute query - return (await db.all(query, values)).map(massagePostRow) + var rows = await db.all(query, values) + return Promise.all(rows.map(massagePostRow)) } +/** + * @description + * Get crawled post. + * + * @param {string} url - The URL of the post or of the author (if pathname is provided). + * @param {string} [pathname] - The pathname of the post. + * @returns {Promise} + */ const get = exports.get = async function (url, pathname = undefined) { // validate & parse params if (url) { @@ -157,7 +203,7 @@ const get = exports.get = async function (url, pathname = undefined) { pathname = pathname || url.pathname // execute query - return massagePostRow(await db.get(` + return await massagePostRow(await db.get(` SELECT crawl_posts.*, src.url AS crawlSourceUrl FROM crawl_posts @@ -169,6 +215,15 @@ const get = exports.get = async function (url, pathname = undefined) { `, [url.origin, pathname])) } +/** + * @description + * Create a new post. + * + * @param {InternalDatArchive} archive - where to write the post to. + * @param {Object} post + * @param {string} post.content + * @returns {Promise} + */ exports.create = async function (archive, {content} = {}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() @@ -182,6 +237,16 @@ exports.create = async function (archive, {content} = {}) { await crawler.crawlSite(archive) } +/** + * @description + * Update the content of an existing post. + * + * @param {InternalDatArchive} archive - where to write the post to. + * @param {string} pathname - the pathname of the post. + * @param {Object} post + * @param {string} post.content + * @returns {Promise} + */ exports.edit = async function (archive, pathname, {content} = {}) { assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') assert(typeof content === 'string', 'Edit() must be provided a `content` string') @@ -195,6 +260,14 @@ exports.edit = async function (archive, pathname, {content} = {}) { await crawler.crawlSite(archive) } +/** + * @description + * Delete an existing post + * + * @param {InternalDatArchive} archive - where to write the post to. + * @param {string} pathname - the pathname of the post. 
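A sketch of a full round trip through this posts API, using only the signatures documented in this file; illustrative only, not part of this commit (require paths assume the repo root):

const dat = require('./dat')
const posts = require('./crawler/posts')

async function examplePostLifecycle (userUrl) {
  const archive = await dat.library.getOrLoadArchive(userUrl)

  await posts.create(archive, {content: 'hello, distributed web'})

  // author, reverse, and limit are the list() filters documented above
  const [latest] = await posts.list({author: userUrl, reverse: true, limit: 1})

  await posts.edit(archive, latest.pathname, {content: 'hello (edited)'})
  await posts.delete(archive, latest.pathname)
}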
+ * @returns {Promise} + */ exports.delete = async function (archive, pathname) { assert(typeof pathname === 'string', 'Delete() must be provided a valid URL string') await archive.pda.unlink(pathname) @@ -204,23 +277,42 @@ exports.delete = async function (archive, pathname) { // internal methods // = +/** + * @param {string} v + * @returns {boolean} + */ function isString (v) { return typeof v === 'string' } +/** + * @param {string} url + * @returns {string} + */ function toOrigin (url) { url = new URL(url) return url.protocol + '//' + url.hostname } +/** + * @param {InternalDatArchive} archive + * @param {string} pathname + * @returns {Promise} + */ async function ensureDirectory (archive, pathname) { try { await archive.pda.mkdir(pathname) } catch (e) { /* ignore */ } } -function massagePostRow (row) { +/** + * @param {Object} row + * @returns {Post} + */ +async function massagePostRow (row) { if (!row) return null - row.author = {url: row.crawlSourceUrl} + row.author = await siteDescriptions.getBest({subject: row.crawlSourceUrl}) +console.log('author for', row.author, row) + if (!row.author) row.author = {url: row.crawlSourceUrl} delete row.crawlSourceUrl delete row.crawlSourceId return row diff --git a/crawler/search.js b/crawler/search.js index 6c92b7db..abe5278f 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -7,6 +7,7 @@ const datLibrary = require('../dat/library') const followgraph = require('./followgraph') const siteDescriptions = require('./site-descriptions') const {getBasicType} = require('../lib/dat') +const {getSiteDescriptionThumbnailUrl} = require('./util') /** @type {Array} */ const BUILTIN_PAGES = [ @@ -23,17 +24,8 @@ const BUILTIN_PAGES = [ // typedefs // = -// exported api -// = - /** - * @description - * Get suggested content of various types. - * - * @param {string} [query=''] - The search query. - * @param {Object} [opts={}] - * @param {boolean} [opts.filterPins] - If true, will filter out pinned bookmarks. - * @returns {Promise} + * @typedef SiteDescription { import("./site-descriptions").SiteDescription } * * @typedef {Object} SuggestionResults * @prop {Array} apps @@ -45,7 +37,42 @@ const BUILTIN_PAGES = [ * @prop {(undefined|Array)} bookmarks * @prop {(undefined|Array)} history * - * TODO: make the return values much more concrete + * TODO: define the SuggestionResults values + * + * @typedef {Object} SearchResults + * @prop {number} highlightNonce - A number used to create perimeters around text that should be highlighted. + * @prop {(null|Array)} people + * @prop {(null|Array)} posts + * + * @typedef {Object} PeopleSearchResult + * @prop {string} url + * @prop {string} title + * @prop {string} description + * @prop {Array} followedBy + * @prop {bool} followsUser + * @prop {string} thumbUrl + * @prop {Object} author + * @prop {string} author.url + * + * @typedef {Object} PostSearchResult + * @prop {string} url + * @prop {SiteDescription} author + * @prop {string} content + * @prop {number} createdAt + * @prop {number} updatedAt + */ + +// exported api +// = + +/** + * @description + * Get suggested content of various types. + * + * @param {string} [query=''] - The search query. + * @param {Object} [opts={}] + * @param {boolean} [opts.filterPins] - If true, will filter out pinned bookmarks. 
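A sketch of how a builtin page would reach these functions over the beaker.crawler RPC wiring added earlier in this series; the global beaker object is assumed, the option names are taken from the surrounding JSDoc and function body, and the backing implementation may require further options (e.g. the querying user). Illustrative only:

async function exampleSearchUi () {
  // suggestions for the URL bar; filterPins drops already-pinned bookmarks
  const suggestions = await beaker.crawler.listSuggestions('beak', {filterPins: true})
  console.log(suggestions.bookmarks, suggestions.history)

  // full search across crawled people and posts
  const results = await beaker.crawler.listSearchResults({query: 'p2p', limit: 20})
  console.log(results.people, results.posts)
}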
+ * @returns {Promise} */ exports.listSuggestions = async function (query = '', opts = {}) { var suggestions = {} @@ -99,39 +126,6 @@ exports.listSuggestions = async function (query = '', opts = {}) { * @param {number} [opts.offset] * @param {number} [opts.limit = 20] * @returns {Promise} - * - * Search results: - * @typedef {Object} SearchResults - * @prop {number} highlightNonce - A number used to create perimeters around text that should be highlighted. - * @prop {(null|Array)} people - * @prop {(null|Array)} posts - * - * People search results: - * @typedef {Object} PeopleSearchResult - * @prop {string} url - * @prop {string} title - * @prop {string} description - * @prop {Array} followedBy - * @prop {bool} followsUser - * @prop {Object} author - * @prop {string} author.url - * - * Post search results: - * @typedef {Object} PostSearchResult - * @prop {string} url - * @prop {SiteDescription} author - * @prop {string} content - * @prop {string} createdAt - * @prop {string} [updatedAt] - * - * Site description objects: - * @typedef {Object} SiteDescription - * @prop {string} url - * @prop {string} [title] - * @prop {string} [description] - * @prop {Array} [type] - * @prop {Object} [author] - * @prop {string} [author.url] */ exports.listSearchResults = async function (opts) { const highlightNonce = (Math.random() * 1e3)|0 @@ -186,29 +180,38 @@ exports.listSearchResults = async function (opts) { if (query) { searchResults.people = await db.all(` SELECT - desc.subject AS url, + desc.url AS url, descSrc.url AS authorUrl, SNIPPET(crawl_site_descriptions_fts_index, 0, '${startHighlight}', '${endHighlight}', '...', 25) AS title, SNIPPET(crawl_site_descriptions_fts_index, 1, '${startHighlight}', '${endHighlight}', '...', 25) AS description FROM crawl_site_descriptions_fts_index desc_fts INNER JOIN crawl_site_descriptions desc ON desc.rowid = desc_fts.rowid - INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.subject AND fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) + LEFT JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.url INNER JOIN crawl_sources descSrc ON desc.crawlSourceId = descSrc.id - WHERE crawl_site_descriptions_fts_index MATCH ? + WHERE + crawl_site_descriptions_fts_index MATCH ? + AND ( + fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) -- description by a followed user + OR (desc.url = ? AND desc.crawlSourceId = ?) -- description by me about me + ) ORDER BY rank LIMIT ? OFFSET ?; - `, [query, limit, offset]) + `, [query, user, userCrawlSourceId, limit, offset]) } else { searchResults.people = await db.all(` - SELECT desc.subject AS url, desc.title, desc.description, descSrc.url AS authorUrl + SELECT desc.url AS url, desc.title, desc.description, descSrc.url AS authorUrl FROM crawl_site_descriptions desc - INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.subject AND fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) + LEFT JOIN crawl_followgraph fgraph ON fgraph.destUrl = desc.url INNER JOIN crawl_sources descSrc ON desc.crawlSourceId = descSrc.id - ORDER BY desc.createdAt + WHERE ( + fgraph.crawlSourceId IN (${crawlSourceIds.join(',')}) -- description by a followed user + OR (desc.url = ? AND desc.crawlSourceId = ?) -- description by me about me + ) + ORDER BY desc.title LIMIT ? 
OFFSET ?; - `, [limit, offset]) + `, [user, userCrawlSourceId, limit, offset]) } searchResults.people = _uniqWith(searchResults.people, (a, b) => a.url === b.url) await Promise.all(searchResults.people.map(async (p) => { @@ -217,6 +220,7 @@ exports.listSearchResults = async function (opts) { p.followsUser = await followgraph.isAFollowingB(p.url, user) // massage attrs + p.thumbUrl = getSiteDescriptionThumbnailUrl(p.authorUrl, p.url) p.author = {url: p.authorUrl} delete p.authorUrl })) @@ -265,17 +269,6 @@ exports.listSearchResults = async function (opts) { delete p.authorUrl delete p.pathname })) - // TODO hops == 2 - /*searchResults.posts = await db.all(` - SELECT post.content, post.pathname, postSrc.url - FROM crawl_posts post - INNER JOIN crawl_sources postSrc ON post.crawlSourceId = postSrc.id - INNER JOIN crawl_followgraph fgraph ON fgraph.destUrl = postSrc.url AND fgraph.crawlSourceId = ? - WHERE (post.content MATCH ?) AND (post.createdAt >= ?) - ORDER BY rank - LIMIT ? - OFFSET ?; - `, [userCrawlSourceId, query, since, offset, limit])*/ } return searchResults diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js index 7e9c18e2..91dafd26 100644 --- a/crawler/site-descriptions.js +++ b/crawler/site-descriptions.js @@ -1,20 +1,42 @@ const assert = require('assert') const {URL} = require('url') const Events = require('events') -const _pick = require('lodash.pick') const db = require('../dbs/profile-data-db') const archivesDb = require('../dbs/archives') const dat = require('../dat') const crawler = require('./index') -const {doCrawl, doCheckpoint, emitProgressEvent, getMatchingChangesInOrder, generateTimeFilename} = require('./util') +const { + doCrawl, + doCheckpoint, + emitProgressEvent, + getMatchingChangesInOrder, + generateTimeFilename, + getSiteDescriptionThumbnailUrl, + toHostname +} = require('./util') const debug = require('../lib/debug-logger').debugLogger('crawler') // constants // = const TABLE_VERSION = 1 -const JSON_TYPE = 'unwalled.garden/site-description' -const JSON_PATH_REGEX = /^\/data\/known_sites\/([^/]+)\.json$/i +const JSON_PATH_REGEX = /^\/(dat\.json|data\/known_sites\/([^/]+)\/dat\.json)$/i + +// typedefs +// = + +/** + * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} + * + * @typedef {Object} SiteDescription + * @prop {string} url + * @prop {string} title + * @prop {string} description + * @prop {Array} type + * @prop {string} thumbUrl + * @prop {Object} descAuthor + * @prop {string} descAuthor.url + */ // globals // = @@ -28,6 +50,14 @@ exports.on = events.on.bind(events) exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) +/** + * @description + * Crawl the given site for site descriptions. + * + * @param {InternalDatArchive} archive - site to crawl. + * @param {CrawlSourceRecord} crawlSource - internal metadata about the crawl target. 
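To make the new indexing surface concrete, a quick check of which paths the JSON_PATH_REGEX above accepts (illustrative only; the hostnames are made up):

const re = /^\/(dat\.json|data\/known_sites\/([^/]+)\/dat\.json)$/i

console.log(re.test('/dat.json'))                             // true: the site's own manifest (self-description)
console.log(re.test('/data/known_sites/alice.com/dat.json'))  // true: a folder-based capture of alice.com
console.log(re.test('/data/known_sites/alice.com/thumb.png')) // false: thumbs are captured but not indexed here
console.log(re.test('/data/known_sites/alice.com.json'))      // false: the old single-file capture format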
+ * @returns {Promise} + */ exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_site_descriptions', TABLE_VERSION, async ({changes, resetRequired}) => { const supressEvents = resetRequired === true // dont emit when replaying old info @@ -52,11 +82,15 @@ exports.crawlSite = async function (archive, crawlSource) { // this means that a single bad or unreachable file can stop the forward progress of description indexing // to solve this, we need to find a way to tolerate bad description-files without losing our ability to efficiently detect new posts // -prf + + // determine the url + let url = getUrlFromDescriptionPath(archive, changedSiteDescription.name) + if (changedSiteDescription.type === 'del') { // delete await db.run(` - DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND pathname = ? - `, [crawlSource.id, changedSiteDescription.name]) + DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND url = ? + `, [crawlSource.id, url]) events.emit('description-removed', archive.url) } else { // read and validate @@ -64,38 +98,30 @@ exports.crawlSite = async function (archive, crawlSource) { try { desc = JSON.parse(await archive.pda.readFile(changedSiteDescription.name, 'utf8')) assert(typeof desc === 'object', 'File be an object') - assert(desc.type === 'unwalled.garden/site-description', 'JSON .type must be unwalled.garden/site-description') - assert(typeof desc.subject === 'string', 'JSON .subject must be a URL string') - try { let subject = new URL(desc.subject) } - catch (e) { throw new Error('JSON .subject must be a URL string') } - assert(desc.metadata && typeof desc.metadata === 'object', 'JSON .metadata must be object') - assert(typeof desc.createdAt === 'string', 'JSON .createdAt must be a date-time') - assert(!isNaN(Number(new Date(desc.createdAt))), 'JSON .createdAt must be a date-time') } catch (err) { + console.error('Failed to read site-description file', {url: archive.url, name: changedSiteDescription.name, err}) debug('Failed to read site-description file', {url: archive.url, name: changedSiteDescription.name, err}) return // abort indexing } // massage the description - desc.subject = toOrigin(desc.subject) - desc.metadata.title = typeof desc.metadata.title === 'string' ? desc.metadata.title : '' - desc.metadata.description = typeof desc.metadata.description === 'string' ? desc.metadata.description : '' - if (typeof desc.metadata.type === 'string') desc.metadata.type = desc.metadata.type.split(',') - if (Array.isArray(desc.metadata.type)) { - desc.metadata.type = desc.metadata.type.filter(isString) + desc.title = typeof desc.title === 'string' ? desc.title : '' + desc.description = typeof desc.description === 'string' ? desc.description : '' + if (typeof desc.type === 'string') desc.type = desc.type.split(',') + if (Array.isArray(desc.type)) { + desc.type = desc.type.filter(isString) } else { - desc.metadata.type = [] + desc.type = [] } - desc.createdAt = Number(new Date(desc.createdAt)) // replace await db.run(` - DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND pathname = ? - `, [crawlSource.id, changedSiteDescription.name]) + DELETE FROM crawl_site_descriptions WHERE crawlSourceId = ? AND url = ? + `, [crawlSource.id, url]) await db.run(` - INSERT OR REPLACE INTO crawl_site_descriptions (crawlSourceId, pathname, crawledAt, subject, title, description, type, createdAt) - VALUES (?, ?, ?, ?, ?, ?, ?, ?) 
- `, [crawlSource.id, changedSiteDescription.name, Date.now(), desc.subject, desc.metadata.title, desc.metadata.description, desc.metadata.type.join(','), desc.createdAt]) + INSERT OR REPLACE INTO crawl_site_descriptions (crawlSourceId, crawledAt, url, title, description, type) + VALUES (?, ?, ?, ?, ?, ?) + `, [crawlSource.id, Date.now(), url, desc.title, desc.description, desc.type.join(',')]) events.emit('description-added', archive.url) } @@ -106,6 +132,18 @@ exports.crawlSite = async function (archive, crawlSource) { }) } +/** + * @description + * List crawled site descriptions. + * + * @param {Object} [opts] + * @param {string} [opts.subject] - (URL) filter descriptions to those which describe this subject. + * @param {string} [opts.author] - (URL) filter descriptions to those created by this author. + * @param {number} [opts.offset] + * @param {number} [opts.limit] + * @param {boolean} [opts.reverse] + * @returns {Promise>} + */ const list = exports.list = async function ({offset, limit, reverse, author, subject} = {}) { // validate & parse params assert(!offset || typeof offset === 'number', 'Offset must be a number') @@ -153,13 +191,12 @@ const list = exports.list = async function ({offset, limit, reverse, author, sub query += `(` let op = `` for (let s of subject) { - query += `${op} subject = ?` + query += `${op} crawl_site_descriptions.url = ?` op = ` OR` values.push(s) } query += `) ` } - query += ` ORDER BY createdAt` if (reverse) { query += ` DESC` } @@ -176,141 +213,140 @@ const list = exports.list = async function ({offset, limit, reverse, author, sub return (await db.all(query, values)).map(massageSiteDescriptionRow) } +/** + * @description + * Get the most trustworthy site description available. + * + * @param {Object} [opts] + * @param {string} [opts.subject] - (URL) filter descriptions to those which describe this subject. + * @param {string} [opts.author] - (URL) filter descriptions to those created by this author. + * @returns {Promise} + */ exports.getBest = async function ({subject, author} = {}) { - // TODO - // while the archivesdb is more recent, it won't have the thumbnail - // -prf - // check archivesDb meta - // var meta = await archivesDb.getMeta(subject) - // if (meta) { - // return _pick(meta, ['title', 'description', 'type']) - // } - - // check for descriptions + // TODO choose based on trust var descriptions = await list({subject, author}) - return _pick(descriptions[0] || {}, ['title', 'description', 'type', 'author']) -} - -const get = exports.get = async function (url, pathname = undefined) { - // validate & parse params - if (url) { - try { url = new URL(url) } - catch (e) { throw new Error('Failed to parse post URL: ' + url) } - } - pathname = pathname || url.pathname - - // execute query - return massageSiteDescriptionRow(await db.get(` - SELECT - crawl_site_descriptions.*, src.url AS crawlSourceUrl - FROM crawl_site_descriptions - INNER JOIN crawl_sources src - ON src.id = crawl_site_descriptions.crawlSourceId - AND src.url = ? - WHERE - crawl_site_descriptions.pathname = ? - `, [url.origin, pathname])) + return descriptions[0] } +/** + * @description + * Capture a site description into the archive's known_sites cache. + * + * @param {InternalDatArchive} archive - where to write the capture to. + * @param {(InternalDatArchive|string)} subjectArchive - which archive to capture. 
+ * @returns Promise + */ exports.capture = async function (archive, subjectArchive) { if (typeof subjectArchive === 'string') { subjectArchive = await dat.library.getOrLoadArchive(subjectArchive) } - // capture metadata + // create directory + var hostname = toHostname(subjectArchive.url) + await ensureDirectory(archive, '/data') + await ensureDirectory(archive, '/data/known_sites') + await ensureDirectory(archive, `/data/known_sites/${hostname}`) + + // capture dat.json try { - var info = JSON.parse(await subjectArchive.pda.readFile('/dat.json')) + var datJson = JSON.parse(await subjectArchive.pda.readFile('/dat.json')) } catch (e) { console.error('Failed to read dat.json of subject archive', e) debug('Failed to read dat.json of subject archive', e) throw new Error('Unabled to read subject dat.json') } - await put(archive, { - subject: subjectArchive.url, - title: typeof info.title === 'string' ? info.title : undefined, - description: typeof info.description === 'string' ? info.description : undefined, - type: typeof info.type === 'string' || (Array.isArray(info.type) && info.type.every(isString)) ? info.type : undefined - }) + await archive.pda.writeFile(`/data/known_sites/${hostname}/dat.json`, JSON.stringify(datJson)) // capture thumb for (let ext of ['jpg', 'jpeg', 'png']) { let thumbPath = `/thumb.${ext}` if (await fileExists(subjectArchive, thumbPath)) { - let targetPath = `/data/known_sites/${toHostname(subjectArchive.url)}.${ext}` + let targetPath = `/data/known_sites/${hostname}/thumb.${ext}` await archive.pda.writeFile(targetPath, await subjectArchive.pda.readFile(thumbPath, 'binary'), 'binary') break } } } -const put = -exports.put = async function (archive, {subject, title, description, type} = {}) { - assert(typeof subject === 'string', 'Put() must be provided a `subject` string') - try { - var subjectUrl = new URL(subject) - } catch (e) { - throw new Error('Put() `subject` must be a valid URL') - } - assert(!title || typeof title === 'string', 'Put() `title` must be a string') - assert(!description || typeof description === 'string', 'Put() `description` must be a string') - if (type) { - if (typeof type === 'string') type = type.split(',') - assert(Array.isArray(type), 'Put() `type` must be a string or an array of strings') - assert(type.every(isString), 'Put() `type` must be a string or an array of strings') +/** + * @description + * Delete a captured site description in the given archive's known_sites cache. + * + * @param {InternalDatArchive} archive - where to remove the capture from. + * @param {(InternalDatArchive|string)} subjectUrl - which archive's capture to remove. 
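A sketch of what capture() and deleteCapture() leave behind in the calling archive, using a made-up subject URL; illustrative only, not part of this commit:

const siteDescriptions = require('./crawler/site-descriptions')
const {getSiteDescriptionThumbnailUrl} = require('./crawler/util')

async function exampleCapture (archive) {
  // snapshots dat://bob.com into this archive's cache:
  //   /data/known_sites/bob.com/dat.json
  //   /data/known_sites/bob.com/thumb.png  (only when the subject publishes a thumb)
  await siteDescriptions.capture(archive, 'dat://bob.com')

  // a description authored by this archive about bob resolves its thumb to
  // <archive.url>/data/known_sites/bob.com/thumb
  console.log(getSiteDescriptionThumbnailUrl(archive.url, 'dat://bob.com'))

  // drop the capture again (removes the folder recursively)
  await siteDescriptions.deleteCapture(archive, 'dat://bob.com')
}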
+ * @returns Promise + */ +exports.deleteCapture = async function (archive, subjectUrl) { + if (subjectUrl && subjectUrl.url) { + subjectUrl = subjectUrl.url } - await ensureDirectory(archive, '/data') - await ensureDirectory(archive, '/data/known_sites') - await archive.pda.writeFile(`/data/known_sites/${subjectUrl.hostname}.json`, JSON.stringify({ - type: JSON_TYPE, - subject: subjectUrl.toString(), - metadata: { - title, - description, - type - }, - createdAt: (new Date()).toISOString() - })) - await crawler.crawlSite(archive) -} - -exports.delete = async function (archive, pathname) { - assert(typeof pathname === 'string', 'Delete() must be provided a valid URL string') - await archive.pda.unlink(pathname) + assert(typeof subjectUrl === 'string', 'Delete() must be provided a valid URL string') + var hostname = toHostname(subjectUrl) + await archive.pda.rmdir(`/data/known_sites/${hostname}`, {recursive: true}) await crawler.crawlSite(archive) } // internal methods // = +/** + * @param {any} v + * returns {boolean} + */ function isString (v) { return typeof v === 'string' } +/** + * @param {string} url + * @returns {string} + */ function toOrigin (url) { url = new URL(url) return url.protocol + '//' + url.hostname } -function toHostname (url) { - url = new URL(url) - return url.hostname +/** + * @param {InternalDatArchive} archive + * @param {string} name + * @returns {string} + */ +function getUrlFromDescriptionPath (archive, name) { + if (name === '/dat.json') return archive.url + name = name.split('/') // '/data/known_sites/{hostname}/dat.json' -> ['', 'data', 'known_sites', hostname, 'dat.json'] + return 'dat://' + name[3] } +/** + * @param {InternalDatArchive} archive + * @param {string} pathname + * @returns {Promise} + */ async function ensureDirectory (archive, pathname) { try { await archive.pda.mkdir(pathname) } catch (e) { /* ignore */ } } +/** + * @param {InternalDatArchive} archive + * @param {string} pathname + * @returns {Promise} + */ async function fileExists (archive, pathname) { try { await archive.pda.stat(pathname) } catch (e) { return false } return true } +/** + * @param {Object} row + * @returns {SiteDescription} + */ function massageSiteDescriptionRow (row) { if (!row) return null row.author = {url: row.crawlSourceUrl} row.type = row.type && typeof row.type === 'string' ? 
row.type.split(',') : undefined + row.thumbUrl = getSiteDescriptionThumbnailUrl(row.author.url, row.url) delete row.crawlSourceUrl delete row.crawlSourceId return row diff --git a/crawler/util.js b/crawler/util.js index 04a9f7b2..657e0d6f 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -6,9 +6,29 @@ const dat = require('../dat') const READ_TIMEOUT = 30e3 +// typedefs +// = + +/** + * @typedef {Object} CrawlSourceRecord + * @prop {string} id + * @prop {string} url + */ + +// exported api +// = + const crawlerEvents = new EventEmitter() exports.crawlerEvents = crawlerEvents +/** + * @param {InternalDatArchive} archive + * @param {CrawlSourceRecord} crawlSource + * @param {string} crawlDataset + * @param {number} crawlDatasetVersion + * @param {(Object) => undefined} handlerFn + * @returns {Promise} + */ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatasetVersion, handlerFn) { const url = archive.url @@ -53,6 +73,13 @@ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatas crawlerEvents.emit('crawl-dataset-finish', {sourceUrl: archive.url, crawlDataset, crawlRange: {start, end}}) } +/** + * @param {string} crawlDataset + * @param {number} crawlDatasetVersion + * @param {CrawlSourceRecord} crawlSource + * @param {number} crawlSourceVersion + * @returns {Promise} + */ const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlDatasetVersion, crawlSource, crawlSourceVersion) { await db.run(`DELETE FROM crawl_sources_meta WHERE crawlDataset = ? AND crawlSourceId = ?`, [crawlDataset, crawlSource.id]) await db.run(` @@ -62,10 +89,21 @@ const doCheckpoint = exports.doCheckpoint = async function (crawlDataset, crawlD `, [crawlDataset, crawlDatasetVersion, crawlSource.id, crawlSourceVersion, Date.now()]) } +/** + * @param {string} sourceUrl + * @param {string} crawlDataset + * @param {number} progress + * @param {number} numUpdates + */ exports.emitProgressEvent = function (sourceUrl, crawlDataset, progress, numUpdates) { crawlerEvents.emit('crawl-dataset-progress', {sourceUrl, crawlDataset, progress, numUpdates}) } +/** + * @param {Array} changes + * @param {RegExp} regex + * @returns {Array} + */ exports.getMatchingChangesInOrder = function (changes, regex) { var list = [] // order matters, must be oldest to newest changes.forEach(c => { @@ -78,6 +116,9 @@ exports.getMatchingChangesInOrder = function (changes, regex) { return list } +/** + * @returns {string} + */ var _lastGeneratedTimeFilename exports.generateTimeFilename = function () { var d = Date.now() @@ -86,4 +127,26 @@ exports.generateTimeFilename = function () { } _lastGeneratedTimeFilename = d return (new Date(d)).toISOString() -} \ No newline at end of file +} + +/** + * @param {string} url + * @returns {string} + */ +const toHostname = +exports.toHostname = function (url) { + url = new URL(url) + return url.hostname +} + +/** + * @description Helper to determine the thumbUrl for a site description. + * @param {string} author - (URL) the author of the site description. + * @param {string} subject - (URL) the site being described. + * @returns {string} - the URL of the thumbnail. + */ +exports.getSiteDescriptionThumbnailUrl = function (author, subject) { + return author === subject + ? 
`${subject}/thumb` // self-description, use their own thumb + : `${author}/data/known_sites/${toHostname(subject)}/thumb` // use captured thumb +} diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index 542ea376..a4c919b4 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -79,8 +79,7 @@ migrations = [ migration('profile-data.v21.sql'), migration('profile-data.v22.sql', {canFail: true}), // canFail for the same reason as v16, ffs migration('profile-data.v23.sql'), - migration('profile-data.v24.sql'), - migration('profile-data.v25.sql') + migration('profile-data.v24.sql') ] function migration (file, opts = {}) { return cb => { diff --git a/dbs/schemas/profile-data.sql.js b/dbs/schemas/profile-data.sql.js index f59bada2..a2310263 100644 --- a/dbs/schemas/profile-data.sql.js +++ b/dbs/schemas/profile-data.sql.js @@ -132,16 +132,13 @@ CREATE TABLE crawl_sources_meta ( -- crawled descriptions of other sites CREATE TABLE crawl_site_descriptions ( crawlSourceId INTEGER NOT NULL, - pathname TEXT NOT NULL, crawledAt INTEGER, - subject TEXT, + url TEXT, title TEXT, description TEXT, type TEXT, -- comma separated strings - createdAt INTEGER, - PRIMARY KEY (crawlSourceId, pathname), FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); CREATE VIRTUAL TABLE crawl_site_descriptions_fts_index USING fts5(title, description, content='crawl_site_descriptions'); @@ -258,5 +255,5 @@ INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Report an issu INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Explore the p2p Web', 'dat://taravancil.com/explore-the-p2p-web.md', 1); INSERT INTO bookmarks (profileId, title, url, pinned) VALUES (0, 'Support Beaker', 'https://opencollective.com/beaker', 1); -PRAGMA user_version = 25; +PRAGMA user_version = 24; ` diff --git a/dbs/schemas/profile-data.v24.sql.js b/dbs/schemas/profile-data.v24.sql.js index e9b7bb71..eae3dcd7 100644 --- a/dbs/schemas/profile-data.v24.sql.js +++ b/dbs/schemas/profile-data.v24.sql.js @@ -27,18 +27,29 @@ CREATE TABLE crawl_sources_meta ( -- crawled descriptions of other sites CREATE TABLE crawl_site_descriptions ( crawlSourceId INTEGER NOT NULL, - pathname TEXT NOT NULL, crawledAt INTEGER, - subject TEXT, + url TEXT, title TEXT, description TEXT, type TEXT, -- comma separated strings - createdAt INTEGER, PRIMARY KEY (crawlSourceId, pathname), FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +CREATE VIRTUAL TABLE crawl_site_descriptions_fts_index USING fts5(title, description, content='crawl_site_descriptions'); + +-- triggers to keep crawl_site_descriptions_fts_index updated +CREATE TRIGGER crawl_site_descriptions_ai AFTER INSERT ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; +CREATE TRIGGER crawl_site_descriptions_ad AFTER DELETE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.rowid, old.title, old.description); +END; +CREATE TRIGGER crawl_site_descriptions_au AFTER UPDATE ON crawl_site_descriptions BEGIN + INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.a, old.title, old.description); + INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); +END; -- crawled posts 
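For context, the external-content FTS index and triggers defined above get queried roughly like this elsewhere in the series (compare crawler/search.js); a simplified sketch, not part of this commit:

const db = require('./dbs/profile-data-db')

async function exampleDescriptionSearch (q) {
  // lowercase, strip FTS operators, and match prefixes (same massaging as crawler/search.js)
  const match = q.toLowerCase().replace(/[:^*.]/g, ' ') + '*'
  return db.all(`
    SELECT
      desc.url AS url,
      SNIPPET(crawl_site_descriptions_fts_index, 0, '<b>', '</b>', '...', 25) AS title
    FROM crawl_site_descriptions_fts_index
    INNER JOIN crawl_site_descriptions desc ON desc.rowid = crawl_site_descriptions_fts_index.rowid
    WHERE crawl_site_descriptions_fts_index MATCH ?
    ORDER BY rank
    LIMIT 20
  `, [match])
}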
CREATE TABLE crawl_posts ( @@ -52,6 +63,19 @@ CREATE TABLE crawl_posts ( FOREIGN KEY (crawlSourceId) REFERENCES crawl_sources (id) ON DELETE CASCADE ); +CREATE VIRTUAL TABLE crawl_posts_fts_index USING fts5(content, content='crawl_posts'); + +-- triggers to keep crawl_posts_fts_index updated +CREATE TRIGGER crawl_posts_ai AFTER INSERT ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; +CREATE TRIGGER crawl_posts_ad AFTER DELETE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); +END; +CREATE TRIGGER crawl_posts_au AFTER UPDATE ON crawl_posts BEGIN + INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); + INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); +END; -- crawled follows CREATE TABLE crawl_followgraph ( diff --git a/dbs/schemas/profile-data.v25.sql.js b/dbs/schemas/profile-data.v25.sql.js deleted file mode 100644 index b84e73a1..00000000 --- a/dbs/schemas/profile-data.v25.sql.js +++ /dev/null @@ -1,32 +0,0 @@ -module.exports = ` - --- add full-text search indexes -CREATE VIRTUAL TABLE crawl_site_descriptions_fts_index USING fts5(title, description, content='crawl_site_descriptions'); -CREATE VIRTUAL TABLE crawl_posts_fts_index USING fts5(content, content='crawl_posts'); - --- triggers to keep crawl_site_descriptions_fts_index updated -CREATE TRIGGER crawl_site_descriptions_ai AFTER INSERT ON crawl_site_descriptions BEGIN - INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); -END; -CREATE TRIGGER crawl_site_descriptions_ad AFTER DELETE ON crawl_site_descriptions BEGIN - INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.rowid, old.title, old.description); -END; -CREATE TRIGGER crawl_site_descriptions_au AFTER UPDATE ON crawl_site_descriptions BEGIN - INSERT INTO crawl_site_descriptions_fts_index(crawl_site_descriptions_fts_index, rowid, title, description) VALUES('delete', old.a, old.title, old.description); - INSERT INTO crawl_site_descriptions_fts_index(rowid, title, description) VALUES (new.rowid, new.title, new.description); -END; - --- triggers to keep crawl_posts_fts_index updated -CREATE TRIGGER crawl_posts_ai AFTER INSERT ON crawl_posts BEGIN - INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); -END; -CREATE TRIGGER crawl_posts_ad AFTER DELETE ON crawl_posts BEGIN - INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); -END; -CREATE TRIGGER crawl_posts_au AFTER UPDATE ON crawl_posts BEGIN - INSERT INTO crawl_posts_fts_index(crawl_posts_fts_index, rowid, content) VALUES('delete', old.rowid, old.content); - INSERT INTO crawl_posts_fts_index(rowid, content) VALUES (new.rowid, new.content); -END; - -PRAGMA user_version = 25; -` \ No newline at end of file From c0419be3bf3b12150e0c9b6259415b305f71e44a Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Fri, 11 Jan 2019 19:05:33 -0600 Subject: [PATCH 054/245] Move crawler to a priority queueing system --- crawler/followgraph.js | 2 +- crawler/index.js | 23 ++----- crawler/search.js | 8 +-- users/index.js | 145 +++++++++++++++++++++++++++-------------- 4 files changed, 106 insertions(+), 72 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js 
index 7f967e2e..21cee3fd 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -188,7 +188,7 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, } return Promise.all(rows.map(async (row) => { var url = toOrigin(row.destUrl) - var desc = await siteDescriptions.getBest({subject: url, author: subject}) + var desc = (await siteDescriptions.getBest({subject: url, author: subject})) || {} desc.url = url if (followedBy) { desc.followsUser = await isAFollowingB(url, followedBy) diff --git a/crawler/index.js b/crawler/index.js index bcb1c692..52bbd18d 100644 --- a/crawler/index.js +++ b/crawler/index.js @@ -7,17 +7,15 @@ const archivesDb = require('../dbs/archives') const users = require('../users') const dat = require('../dat') -const {crawlerEvents} = require('./util') +const {crawlerEvents, toHostname} = require('./util') const posts = require('./posts') const followgraph = require('./followgraph') const siteDescriptions = require('./site-descriptions') -const CRAWL_POLL_INTERVAL = 30e3 - // globals // = -const watches = {} +var watches = {} // exported api // = @@ -43,18 +41,13 @@ exports.watchSite = async function (archive) { // watch for file changes watches[archive.url] = archive.pda.watch() watches[archive.url].on('data', ([event, args]) => { + // BUG watch is really inconsistent -prf console.log('MIRACLE ALERT! The crawler watch stream emitted a change event', archive.url, event, args) if (event === 'invalidated') { queueCrawl() } }) - // HACK - // for reasons that currently surpass me - // the `archive.pda.watch()` call is not currently working all the time - // so we need to poll sites for now - setInterval(queueCrawl, CRAWL_POLL_INTERVAL) - // run the first crawl crawlSite(archive) } @@ -136,12 +129,4 @@ exports.WEBAPI = { return crawlSite(archive) }, resetSite -} - -// internal methods -// = - -function toHostname (url) { - url = new URL(url) - return url.hostname -} +} \ No newline at end of file diff --git a/crawler/search.js b/crawler/search.js index abe5278f..ffeeb2f5 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -150,7 +150,7 @@ exports.listSearchResults = async function (opts) { if (query && typeof query === 'string') { query = query .toLowerCase() // all lowercase. (uppercase is interpretted as a directive by sqlite.) - .replace(/[:^*\.]/g, ' ') // strip symbols that sqlite interprets. + .replace(/[:^*.]/g, ' ') // strip symbols that sqlite interprets. query += '*' // match prefixes } @@ -211,7 +211,7 @@ exports.listSearchResults = async function (opts) { ORDER BY desc.title LIMIT ? OFFSET ?; - `, [user, userCrawlSourceId, limit, offset]) + `, [user, userCrawlSourceId, limit, offset]) } searchResults.people = _uniqWith(searchResults.people, (a, b) => a.url === b.url) await Promise.all(searchResults.people.map(async (p) => { @@ -258,7 +258,7 @@ exports.listSearchResults = async function (opts) { ORDER BY post.createdAt DESC LIMIT ? 
OFFSET ?; - `, [userCrawlSourceId, since, limit, offset]) + `, [userCrawlSourceId, since, limit, offset]) } await Promise.all(searchResults.posts.map(async (p) => { // fetch additional info @@ -270,6 +270,6 @@ exports.listSearchResults = async function (opts) { delete p.pathname })) } - + return searchResults } diff --git a/users/index.js b/users/index.js index b8e00e7f..e90b615f 100644 --- a/users/index.js +++ b/users/index.js @@ -1,6 +1,7 @@ const Events = require('events') const dat = require('../dat') const crawler = require('../crawler') +const followgraph = require('../crawler/followgraph') const db = require('../dbs/profile-data-db') const archivesDb = require('../dbs/archives') const debug = require('../lib/debug-logger').debugLogger('users') @@ -9,6 +10,8 @@ const debug = require('../lib/debug-logger').debugLogger('users') // = const SITE_TYPE = 'unwalled.garden/user' +const CRAWL_TICK_INTERVAL = 5e3 +const NUM_SIMULTANEOUS_CRAWLS = 10 // globals // = @@ -24,9 +27,8 @@ exports.addListener = events.addListener.bind(events) exports.removeListener = events.removeListener.bind(events) exports.setup = async function () { - // wire up events - crawler.followgraph.on('follow-added', onFollowAdded) - crawler.followgraph.on('follow-removed', onFollowRemoved) + // initiate ticker + queueTick() // load the current users users = await db.all(`SELECT * FROM users`) @@ -42,7 +44,7 @@ exports.setup = async function () { try { await validateUserUrl(user.url) user.archive = await dat.library.getOrLoadArchive(user.url) - watchUser(user) + /* dont await */crawler.watchSite(user.archive) events.emit('load-user', user) } catch (err) { debug('Failed to load user', {user, err}) @@ -50,6 +52,49 @@ exports.setup = async function () { }) } +function queueTick () { + setTimeout(tick, CRAWL_TICK_INTERVAL) +} + +async function tick () { + try { + // TODO handle multiple users + var user = users[0] + if (!user) return queueTick() + + // assemble the next set of crawl targets + var crawlTargets = await selectNextCrawlTargets(user) + + // trigger the crawls on each + var activeCrawls = crawlTargets.map(async (crawlTarget) => { + try { + // load archive + var wasLoaded = true // TODO + var archive = await dat.library.getOrLoadArchive(crawlTarget) // TODO timeout on load + + // run crawl + await crawler.crawlSite(archive) + + if (!wasLoaded) { + // unload archive + // TODO + } + } catch (e) { + console.error('Failed to crawl site', crawlTarget, e) + // TODO more handling? 
+ } + }) + + // await all crawls + await Promise.all(activeCrawls) + } catch (e) { + console.error('Crawler tick failed', e) + } + + // queue next tick + queueTick() +} + exports.list = async function () { return Promise.all(users.map(fetchUserInfo)) } @@ -94,7 +139,7 @@ exports.add = async function (url) { // fetch the user archive user.archive = await dat.library.getOrLoadArchive(user.url) - watchUser(user) + /* dont await */crawler.watchSite(user.archive) events.emit('load-user', user) } @@ -107,7 +152,7 @@ exports.remove = async function (url) { // remove the user users.splice(users.indexOf(user), 1) await db.run(`DELETE FROM users WHERE url = ?`, [user.url]) - unwatchUser(user) + /* dont await */crawler.unwatchSite(user.archive) events.emit('unload-user', user) } @@ -118,50 +163,54 @@ async function isUser (url) { return !!(await get(url)) } -async function watchUser (user) { - // watch the user - await crawler.watchSite(user.archive) - - // watch anybody the user follows - var followUrls = await crawler.followgraph.listFollows(user.url) - followUrls.forEach(async (followUrl) => { - try { - await crawler.watchSite(followUrl) - } catch (err) { - debug('Failed to sync followed user', {url: followUrl, err}) - } - }) -} - -async function unwatchUser (user) { - // unwatch anybody the user follows - - // BUG This will cause glitches if there are any shared follows between 2 local users (which is likely) - // sites will be unwatched when they shouldn't be - // this is temporary and will fix itself when beaker restarts - // -prf - - var followUrls = await crawler.followgraph.listFollows(user.url) - followUrls.forEach(crawler.unwatchSite) - - // unwatch the user - await crawler.unwatchSite(user.url) -} - -async function onFollowAdded (sourceUrl, subjectUrl) { - if (isUser(sourceUrl)) { - try { - await crawler.watchSite(subjectUrl) - } catch (err) { - debug('Failed to sync followed user', {url: subjectUrl, err}) - } +/** + * @description + * Assembles a list of crawl targets based on the current database state. + * + * @param {Object} user - the user to select crawl-targets for. + * @returns {Promise>} + * + * Depends on NUM_SIMULTANEOUS_CRAWLS. + * + * This function will assemble the list using simple priority heuristics. The priorities are currently: + * + * 1. Followed sites + * 2. Sites published by followed sites + * 3. Sites followed by followed sites + * + * The sites will be ordered by these priorities and then iterated linearly. The ordering within + * the priority groupings will be according to URL for a deterministic but effectively random ordering. + * + * NOTE. The current database state must be queried every time this function is run because the user + * will follow and unfollow during runtime, which changes the list. 
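To make the wrap-around concrete: a self-contained walk through the cursor arithmetic used below, with NUM_SIMULTANEOUS_CRAWLS = 10 and 25 made-up candidates (illustrative only):

function exampleCursorWalk () {
  const NUM = 10
  const rows = Array.from({length: 25}, (_, i) => `dat://site${i}.com`)
  const user = {crawlSelectorCursor: 0}

  for (let tick = 1; tick <= 3; tick++) {
    let start = user.crawlSelectorCursor || 0
    if (start > rows.length) start = 0
    const end = start + NUM
    let targets = rows.slice(start, end)
    const remaining = NUM - targets.length
    if (remaining && rows.length > NUM) {
      targets = targets.concat(rows.slice(0, remaining)) // wrap around to the front of the list
      user.crawlSelectorCursor = remaining
    } else {
      user.crawlSelectorCursor = end
    }
    console.log(`tick ${tick}:`, targets.length, 'targets, cursor ->', user.crawlSelectorCursor)
    // tick 1: sites 0-9,   cursor -> 10
    // tick 2: sites 10-19, cursor -> 20
    // tick 3: sites 20-24 then wraps to 0-4, cursor -> 5
  }
}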
+ */ +async function selectNextCrawlTargets (user) { + var rows = [] + + // get followed sites + rows = rows.concat(await followgraph.listFollows(user.url)) + + // get sites published by followed sites + // TODO + + // get sites followed by followed sites + rows = rows.concat(await followgraph.listFoaFs(user.url)) + + // assemble into list + var start = user.crawlSelectorCursor || 0 + if (start > rows.length) start = 0 + var end = start + NUM_SIMULTANEOUS_CRAWLS + var nextCrawlTargets = rows.slice(start, end) + var numRemaining = NUM_SIMULTANEOUS_CRAWLS - nextCrawlTargets.length + if (numRemaining && rows.length > NUM_SIMULTANEOUS_CRAWLS) { + // wrap around + nextCrawlTargets = nextCrawlTargets.concat(rows.slice(0, numRemaining)) + user.crawlSelectorCursor = numRemaining + } else { + user.crawlSelectorCursor = end } -} -async function onFollowRemoved (sourceUrl, subjectUrl) { - if (isUser(sourceUrl)) { - await crawler.unwatchSite(subjectUrl) - } + return nextCrawlTargets.map(row => typeof row === 'string' ? row : row.url) } async function fetchUserInfo (user) { From e6b8a81b0f2fbf365aa78ea453ef587dadd72d58 Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sat, 12 Jan 2019 17:18:16 -0600 Subject: [PATCH 055/245] More JSDoc type annotations --- crawler/followgraph.js | 40 +++++++++++++++----------------- crawler/posts.js | 23 +++++++++--------- crawler/search.js | 2 +- crawler/site-descriptions.js | 45 +++++++++++++++++++++--------------- crawler/util.js | 8 ++++--- dat/library.js | 43 ++++++++++++++++++++++++++++++++++ 6 files changed, 106 insertions(+), 55 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index 21cee3fd..e1124bfd 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -1,7 +1,7 @@ const assert = require('assert') const _difference = require('lodash.difference') const Events = require('events') -const {Url} = require('url') +const {URL} = require('url') const lock = require('../lib/lock') const db = require('../dbs/profile-data-db') const crawler = require('./index') @@ -20,13 +20,9 @@ const JSON_PATH = '/data/follows.json' // = /** - * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} - * @typedef SiteDescription {import('./site-descriptions').SiteDescription} - * - * @typedef {Object} SiteDescriptionWithFollowData - * @extends {SiteDescription} - * @prop {boolean} [followsUser] - does this site follow the specified user site? - * @prop {Array} [followedBy] - list of sites following this site. + * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive + * @typedef {import('./util').CrawlSourceRecord} CrawlSourceRecord + * @typedef {import('./site-descriptions').SiteDescription} SiteDescription */ // globals @@ -47,7 +43,7 @@ exports.removeListener = events.removeListener.bind(events) * * @param {InternalDatArchive} archive - site to crawl. * @param {CrawlSourceRecord} crawlSource - internal metadata about the crawl target. - * @returns {Promise} + * @returns {Promise} */ exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_followgraph', TABLE_VERSION, async ({changes, resetRequired}) => { @@ -126,7 +122,7 @@ exports.crawlSite = async function (archive, crawlSource) { * @param {Object} [opts] * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. * @param {boolean} [opts.includeDesc] - output a site description instead of a simple URL. 
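The typedef-import pattern these commits rely on pays off once JS type checking is enabled (for example tsc with checkJs, or a // @ts-check pragma); a small sketch, not part of this commit:

// @ts-check
/** @typedef {import('./crawler/site-descriptions').SiteDescription} SiteDescription */

/**
 * @param {SiteDescription[]} descs
 * @returns {string[]}
 */
function exampleTitles (descs) {
  return descs.map(d => d.title) // d is fully typed; a typo like d.titel is flagged by the checker
}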
- * @returns {(Promise>|Promise>)} + * @returns {Promise>} */ const listFollowers = exports.listFollowers = async function (subject, {followedBy, includeDesc} = {}) { var rows @@ -173,7 +169,7 @@ const listFollowers = exports.listFollowers = async function (subject, {followed * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. * @param {boolean} [opts.includeDesc] - output a site description instead of a simple URL. * @param {boolean} [opts.includeFollowers] - include .followedBy in the result. Requires includeDesc to be true. - * @returns {(Promise>|Promise>)} + * @returns {Promise>} */ const listFollows = exports.listFollows = async function (subject, {followedBy, includeDesc, includeFollowers} = {}) { var rows = await db.all(` @@ -188,13 +184,13 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, } return Promise.all(rows.map(async (row) => { var url = toOrigin(row.destUrl) - var desc = (await siteDescriptions.getBest({subject: url, author: subject})) || {} + var desc = /** @type SiteDescription */ ((await siteDescriptions.getBest({subject: url, author: subject})) || {}) desc.url = url if (followedBy) { desc.followsUser = await isAFollowingB(url, followedBy) } if (includeFollowers) { - desc.followedBy = await listFollowers(url, {followedBy, includeDesc: true}) + desc.followedBy = /** @type Array */ (await listFollowers(url, {followedBy, includeDesc: true})) } return desc })) @@ -207,15 +203,15 @@ const listFollows = exports.listFollows = async function (subject, {followedBy, * @param {string} subject - (URL) * @param {Object} [opts] * @param {string} [opts.followedBy] - (URL) filter results to those followed by the site specified with this param. Causes .followsUser boolean to be set. 
- * @returns {Promise>} + * @returns {Promise>} */ const listFoaFs = exports.listFoaFs = async function (subject, {followedBy} = {}) { var foafs = [] // list URLs followed by subject - var follows = await listFollows(subject, {followedBy, includeDesc: true}) + var follows = /** @type Array */ (await listFollows(subject, {followedBy, includeDesc: true})) for (let follow of follows) { // list follows of this follow - for (let foaf of await listFollows(follow.url, {followedBy, includeDesc: true})) { + for (let foaf of /** @type Array */ (await listFollows(follow.url, {followedBy, includeDesc: true}))) { // ignore if followed by subject or is subject if (foaf.url === subject) continue if (follows.find(v => v.url === foaf.url)) continue @@ -260,7 +256,7 @@ const isAFollowingB = exports.isAFollowingB = async function (a, b) { * * @param {InternalDatArchive} archive * @param {string} followUrl - * @returns {Promise} + * @returns {Promise} */ exports.follow = async function (archive, followUrl) { // normalize followUrl @@ -284,7 +280,7 @@ exports.follow = async function (archive, followUrl) { * * @param {InternalDatArchive} archive * @param {string} followUrl - * @returns {Promise} + * @returns {Promise} */ exports.unfollow = async function (archive, followUrl) { // normalize followUrl @@ -309,8 +305,8 @@ exports.unfollow = async function (archive, followUrl) { */ function toOrigin (url) { try { - url = new URL(url) - return url.protocol + '//' + url.hostname + var urlParsed = new URL(url) + return urlParsed.protocol + '//' + urlParsed.hostname } catch (e) { return null } @@ -337,8 +333,8 @@ async function readFollowsFile (archive) { /** * @param {InternalDatArchive} archive - * @param {(Object) => undefined} updateFn - * @returns {Promise} + * @param {function(Object): void} updateFn + * @returns {Promise} */ async function updateFollowsFile (archive, updateFn) { var release = await lock('crawler:followgraph:' + archive.url) diff --git a/crawler/posts.js b/crawler/posts.js index c5e33378..eaa291a2 100644 --- a/crawler/posts.js +++ b/crawler/posts.js @@ -18,8 +18,9 @@ const JSON_PATH_REGEX = /^\/data\/posts\/([^/]+)\.json$/i // = /** - * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} - * @typedef SiteDescription { import("./site-descriptions").SiteDescription } + * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive + * @typedef {import('./util').CrawlSourceRecord} CrawlSourceRecord + * @typedef { import("./site-descriptions").SiteDescription } SiteDescription * * @typedef {Object} Post * @prop {string} pathname @@ -196,11 +197,12 @@ exports.list = async function ({offset, limit, reverse, author, authors} = {}) { */ const get = exports.get = async function (url, pathname = undefined) { // validate & parse params + var urlParsed if (url) { - try { url = new URL(url) } + try { urlParsed = new URL(url) } catch (e) { throw new Error('Failed to parse post URL: ' + url) } } - pathname = pathname || url.pathname + pathname = pathname || urlParsed.pathname // execute query return await massagePostRow(await db.get(` @@ -212,7 +214,7 @@ const get = exports.get = async function (url, pathname = undefined) { AND src.url = ? WHERE crawl_posts.pathname = ? 
- `, [url.origin, pathname])) + `, [urlParsed.origin, pathname])) } /** @@ -224,7 +226,7 @@ const get = exports.get = async function (url, pathname = undefined) { * @param {string} post.content * @returns {Promise} */ -exports.create = async function (archive, {content} = {}) { +exports.create = async function (archive, {content}) { assert(typeof content === 'string', 'Create() must be provided a `content` string') var filename = generateTimeFilename() await ensureDirectory(archive, '/data') @@ -247,7 +249,7 @@ exports.create = async function (archive, {content} = {}) { * @param {string} post.content * @returns {Promise} */ -exports.edit = async function (archive, pathname, {content} = {}) { +exports.edit = async function (archive, pathname, {content}) { assert(typeof pathname === 'string', 'Edit() must be provided a valid URL string') assert(typeof content === 'string', 'Edit() must be provided a `content` string') var oldJson = JSON.parse(await archive.pda.readFile(pathname)) @@ -290,8 +292,8 @@ function isString (v) { * @returns {string} */ function toOrigin (url) { - url = new URL(url) - return url.protocol + '//' + url.hostname + var urlParsed = new URL(url) + return urlParsed.protocol + '//' + urlParsed.hostname } /** @@ -306,12 +308,11 @@ async function ensureDirectory (archive, pathname) { /** * @param {Object} row - * @returns {Post} + * @returns {Promise} */ async function massagePostRow (row) { if (!row) return null row.author = await siteDescriptions.getBest({subject: row.crawlSourceUrl}) -console.log('author for', row.author, row) if (!row.author) row.author = {url: row.crawlSourceUrl} delete row.crawlSourceUrl delete row.crawlSourceId diff --git a/crawler/search.js b/crawler/search.js index ffeeb2f5..f07f0eb7 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -25,7 +25,7 @@ const BUILTIN_PAGES = [ // = /** - * @typedef SiteDescription { import("./site-descriptions").SiteDescription } + * @typedef {import("./site-descriptions").SiteDescription} SiteDescription * * @typedef {Object} SuggestionResults * @prop {Array} apps diff --git a/crawler/site-descriptions.js b/crawler/site-descriptions.js index 91dafd26..0b865875 100644 --- a/crawler/site-descriptions.js +++ b/crawler/site-descriptions.js @@ -26,7 +26,8 @@ const JSON_PATH_REGEX = /^\/(dat\.json|data\/known_sites\/([^/]+)\/dat\.json)$/i // = /** - * @typedef CrawlSourceRecord {import('./util').CrawlSourceRecord} + * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive + * @typedef {import('./util').CrawlSourceRecord} CrawlSourceRecord * * @typedef {Object} SiteDescription * @prop {string} url @@ -36,6 +37,8 @@ const JSON_PATH_REGEX = /^\/(dat\.json|data\/known_sites\/([^/]+)\/dat\.json)$/i * @prop {string} thumbUrl * @prop {Object} descAuthor * @prop {string} descAuthor.url + * @prop {boolean} [followsUser] - does this site follow the specified user site? + * @prop {Array} [followedBy] - list of sites following this site. */ // globals @@ -56,7 +59,7 @@ exports.removeListener = events.removeListener.bind(events) * * @param {InternalDatArchive} archive - site to crawl. * @param {CrawlSourceRecord} crawlSource - internal metadata about the crawl target. - * @returns {Promise} + * @returns {Promise} */ exports.crawlSite = async function (archive, crawlSource) { return doCrawl(archive, crawlSource, 'crawl_site_descriptions', TABLE_VERSION, async ({changes, resetRequired}) => { @@ -137,8 +140,8 @@ exports.crawlSite = async function (archive, crawlSource) { * List crawled site descriptions. 
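A usage sketch against the list/getBest signatures documented in this file (illustrative only; the subject URL is made up):

const siteDescriptions = require('./crawler/site-descriptions')

async function exampleDescriptionLookups (userUrl) {
  // every crawled description of bob.com
  const all = await siteDescriptions.list({subject: 'dat://bob.com'})

  // the single "best" description (currently just the first match; trust-ranking is still a TODO)
  const best = await siteDescriptions.getBest({subject: 'dat://bob.com', author: userUrl})

  console.log(all.length, best && best.title)
}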
* * @param {Object} [opts] - * @param {string} [opts.subject] - (URL) filter descriptions to those which describe this subject. - * @param {string} [opts.author] - (URL) filter descriptions to those created by this author. + * @param {string | Array} [opts.subject] - (URL) filter descriptions to those which describe this subject. + * @param {string | Array} [opts.author] - (URL) filter descriptions to those created by this author. * @param {number} [opts.offset] * @param {number} [opts.limit] * @param {boolean} [opts.reverse] @@ -233,12 +236,15 @@ exports.getBest = async function ({subject, author} = {}) { * Capture a site description into the archive's known_sites cache. * * @param {InternalDatArchive} archive - where to write the capture to. - * @param {(InternalDatArchive|string)} subjectArchive - which archive to capture. + * @param {(InternalDatArchive|string)} subject - which archive to capture. * @returns Promise */ -exports.capture = async function (archive, subjectArchive) { - if (typeof subjectArchive === 'string') { - subjectArchive = await dat.library.getOrLoadArchive(subjectArchive) +exports.capture = async function (archive, subject) { + var subjectArchive + if (typeof subject === 'string') { + subjectArchive = await dat.library.getOrLoadArchive(subject) + } else { + subjectArchive = subject } // create directory @@ -273,12 +279,15 @@ exports.capture = async function (archive, subjectArchive) { * Delete a captured site description in the given archive's known_sites cache. * * @param {InternalDatArchive} archive - where to remove the capture from. - * @param {(InternalDatArchive|string)} subjectUrl - which archive's capture to remove. + * @param {(InternalDatArchive|string)} subject - which archive's capture to remove. * @returns Promise */ -exports.deleteCapture = async function (archive, subjectUrl) { - if (subjectUrl && subjectUrl.url) { - subjectUrl = subjectUrl.url +exports.deleteCapture = async function (archive, subject) { + var subjectUrl + if (typeof subject === 'string') { + subjectUrl = subject + } else { + subjectUrl = subject.url } assert(typeof subjectUrl === 'string', 'Delete() must be provided a valid URL string') var hostname = toHostname(subjectUrl) @@ -302,8 +311,8 @@ function isString (v) { * @returns {string} */ function toOrigin (url) { - url = new URL(url) - return url.protocol + '//' + url.hostname + var urlParsed = new URL(url) + return urlParsed.protocol + '//' + urlParsed.hostname } /** @@ -313,14 +322,14 @@ function toOrigin (url) { */ function getUrlFromDescriptionPath (archive, name) { if (name === '/dat.json') return archive.url - name = name.split('/') // '/data/known_sites/{hostname}/dat.json' -> ['', 'data', 'known_sites', hostname, 'dat.json'] - return 'dat://' + name[3] + var parts = name.split('/') // '/data/known_sites/{hostname}/dat.json' -> ['', 'data', 'known_sites', hostname, 'dat.json'] + return 'dat://' + parts[3] } /** * @param {InternalDatArchive} archive * @param {string} pathname - * @returns {Promise} + * @returns {Promise} */ async function ensureDirectory (archive, pathname) { try { await archive.pda.mkdir(pathname) } @@ -330,7 +339,7 @@ async function ensureDirectory (archive, pathname) { /** * @param {InternalDatArchive} archive * @param {string} pathname - * @returns {Promise} + * @returns {Promise} */ async function fileExists (archive, pathname) { try { await archive.pda.stat(pathname) } diff --git a/crawler/util.js b/crawler/util.js index 657e0d6f..8e292f1e 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -10,6 
+10,8 @@ const READ_TIMEOUT = 30e3 // = /** + * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive + * * @typedef {Object} CrawlSourceRecord * @prop {string} id * @prop {string} url @@ -26,7 +28,7 @@ exports.crawlerEvents = crawlerEvents * @param {CrawlSourceRecord} crawlSource * @param {string} crawlDataset * @param {number} crawlDatasetVersion - * @param {(Object) => undefined} handlerFn + * @param {function(Object): Promise} handlerFn * @returns {Promise} */ exports.doCrawl = async function (archive, crawlSource, crawlDataset, crawlDatasetVersion, handlerFn) { @@ -135,8 +137,8 @@ exports.generateTimeFilename = function () { */ const toHostname = exports.toHostname = function (url) { - url = new URL(url) - return url.hostname + var urlParsed = new URL(url) + return urlParsed.hostname } /** diff --git a/dat/library.js b/dat/library.js index 3c0af69c..d7b8fd46 100644 --- a/dat/library.js +++ b/dat/library.js @@ -26,6 +26,49 @@ const { const {InvalidURLError} = require('beaker-error-constants') const DAT_DAEMON_MANIFEST = require('./daemon/manifest') +// typedefs +// = + +/** + * @typedef {Object} InternalDatArchive + * @prop {Buffer} key + * @prop {string} url + * @prop {Buffer} discoveryKey + * @prop {boolean} writable + * @prop {function(Function): void} ready + * @prop {function(Object, Function=): void} download + * @prop {function(Object=): ReadableStream} history + * @prop {function(Object=): ReadableStream} createReadStream + * @prop {function(string, Object=, Function=): any} readFile + * @prop {function(number, Object=): ReadableStream} createDiffStream + * @prop {function(string, Object=): WritableStream} createWriteStream + * @prop {function(string, any, Object=, Function=): void} writeFile + * @prop {function(string, Function=): void} unlink + * @prop {function(string, Object=, Function=): void} mkdir + * @prop {function(string, Function=): void} rmdir + * @prop {function(string, Object=, Function=): void} readdir + * @prop {function(string, Object=, Function=): void} stat + * @prop {function(string, Object=, Function=): void} lstat + * @prop {function(string, Object=, Function=): void} access + * @prop {Object} pda + * @prop {function(string): Promise} pda.stat + * @prop {function(string, Object=): Promise} pda.readFile + * @prop {function(string, Object=): Promise>} pda.readdir + * @prop {function(string): Promise} pda.readSize + * @prop {function(string, any, Object=): Promise} pda.writeFile + * @prop {function(string): Promise} pda.mkdir + * @prop {function(string, string): Promise} pda.copy + * @prop {function(string, string): Promise} pda.rename + * @prop {function(string): Promise} pda.unlink + * @prop {function(string, Object=): Promise} pda.rmdir + * @prop {function(string=): Promise} pda.download + * @prop {function(string=): ReadableStream} pda.watch + * @prop {function(): ReadableStream} pda.createNetworkActivityStream + * @prop {function(): Promise} pda.readManifest + * @prop {function(Object): Promise} pda.writeManifest + * @prop {function(Object): Promise} pda.updateManifest + */ + // globals // = From 53ae755938c4a45786813e4cc68d76917e1598fc Mon Sep 17 00:00:00 2001 From: Paul Frazee Date: Sun, 13 Jan 2019 15:04:32 -0600 Subject: [PATCH 056/245] Add jsdocs to the database scripts --- crawler/followgraph.js | 2 +- crawler/search.js | 15 +- crawler/util.js | 2 +- dbs/archives.js | 310 +++++++++++++++++++++++++++++---------- dbs/bookmarks.js | 91 ++++++++++-- dbs/history.js | 63 +++++++- dbs/profile-data-db.js | 22 +++ dbs/settings.js | 25 
+++- dbs/sitedata.js | 88 ++++++++--- dbs/templates.js | 41 ++++++ dbs/watchlist.js | 43 +++++- lib/db.js | 8 +- lib/env.js | 4 + web-apis/bg/watchlist.js | 4 +- 14 files changed, 590 insertions(+), 128 deletions(-) diff --git a/crawler/followgraph.js b/crawler/followgraph.js index e1124bfd..6b27c6b8 100644 --- a/crawler/followgraph.js +++ b/crawler/followgraph.js @@ -75,7 +75,7 @@ exports.crawlSite = async function (archive, crawlSource) { } // diff against the current follows - var currentFollows = await listFollows(archive.url) + var currentFollows = /** @type string[] */(await listFollows(archive.url)) var newFollows = followsJson.urls var adds = _difference(newFollows, currentFollows) var removes = _difference(currentFollows, newFollows) diff --git a/crawler/search.js b/crawler/search.js index f07f0eb7..e788c34c 100644 --- a/crawler/search.js +++ b/crawler/search.js @@ -26,6 +26,7 @@ const BUILTIN_PAGES = [ /** * @typedef {import("./site-descriptions").SiteDescription} SiteDescription + * @typedef {import("../dbs/archives").LibraryArchiveRecord} LibraryArchiveRecord * * @typedef {Object} SuggestionResults * @prop {Array} apps @@ -82,14 +83,14 @@ exports.listSuggestions = async function (query = '', opts = {}) { suggestions.apps = BUILTIN_PAGES.filter(filterFn) // library - var libraryResults = await datLibrary.queryArchives({isSaved: true}) + var libraryResults = /** @type LibraryArchiveRecord[] */(await datLibrary.queryArchives({isSaved: true})) libraryResults = libraryResults.filter(filterFn) - libraryResults = _groupBy(libraryResults, a => getBasicType(a.type)) - suggestions.people = libraryResults.user - suggestions.webPages = libraryResults['web-page'] - suggestions.fileShares = libraryResults['file-share'] - suggestions.imageCollections = libraryResults['image-collection'] - suggestions.others = libraryResults.other + var libraryResultsGrouped = _groupBy(libraryResults, a => getBasicType(a.type)) + suggestions.people = libraryResultsGrouped.user + suggestions.webPages = libraryResultsGrouped['web-page'] + suggestions.fileShares = libraryResultsGrouped['file-share'] + suggestions.imageCollections = libraryResultsGrouped['image-collection'] + suggestions.others = libraryResultsGrouped.other if (query) { // bookmarks diff --git a/crawler/util.js b/crawler/util.js index 8e292f1e..6e0dae76 100644 --- a/crawler/util.js +++ b/crawler/util.js @@ -11,7 +11,7 @@ const READ_TIMEOUT = 30e3 /** * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive - * + * * @typedef {Object} CrawlSourceRecord * @prop {string} id * @prop {string} url diff --git a/dbs/archives.js b/dbs/archives.js index 85433822..67df8bc5 100644 --- a/dbs/archives.js +++ b/dbs/archives.js @@ -12,38 +12,128 @@ const { DAT_GC_EXPIRATION_AGE } = require('../lib/const') +// typedefs +// = + +/** + * @typedef {import('../dat/library').InternalDatArchive} InternalDatArchive + * + * @typedef {Object} LibraryArchiveRecord + * @prop {string} key + * @prop {string} url + * @prop {string} title + * @prop {string} description + * @prop {Array} type + * @prop {number} mtime + * @prop {number} size + * @prop {boolean} isOwner + * @prop {number} lastAccessTime + * @prop {number} lastLibraryAccessTime + * @prop {Object} userSettings + * @prop {boolean} userSettings.isSaved + * @prop {boolean} userSettings.hidden + * @prop {boolean} userSettings.networked + * @prop {boolean} userSettings.autoDownload + * @prop {boolean} userSettings.autoUpload + * @prop {number} userSettings.expiresAt + * @prop {string} 
userSettings.localSyncPath + * @prop {boolean} userSettings.previewMode + * + * @typedef {Object} LibraryArchiveMeta + * @prop {string} key + * @prop {string} title + * @prop {string} description + * @prop {string | Array} type + * @prop {Array} installedNames + * @prop {number} mtime + * @prop {number} size + * @prop {boolean} isOwner + * @prop {number} lastAccessTime + * @prop {number} lastLibraryAccessTime + * + * @typedef {Object} LibraryArchiveUserSettings + * @prop {number} profileId + * @prop {string} key + * @prop {boolean} isSaved + * @prop {boolean} hidden + * @prop {boolean} networked + * @prop {boolean} autoDownload + * @prop {boolean} autoUpload + * @prop {number} expiresAt + * @prop {string} localSyncPath + * @prop {boolean} previewMode + * @prop {number} createdAt + * + * @typedef {Object} MinimalLibraryArchiveRecord + * @prop {string} key + */ + // globals // = -var datPath // path to the dat folder +var datPath /** @type string - path to the dat folder */ var events = new Events() // exported methods // = +/** + * @param {Object} opts + * @param {string} opts.userDataPath + */ exports.setup = function (opts) { // make sure the folders exist datPath = path.join(opts.userDataPath, 'Dat') mkdirp.sync(path.join(datPath, 'Archives')) } +/** + * @returns {string} + */ exports.getDatPath = function () { return datPath } -// get the path to an archive's files +/** + * @description Get the path to an archive's files. + * @param {string | Buffer | InternalDatArchive} archiveOrKey + * @returns {string} + */ +// const getArchiveMetaPath = exports.getArchiveMetaPath = function (archiveOrKey) { - var key = datEncoding.toStr(archiveOrKey.key || archiveOrKey) + var key /** @type string */ + if (typeof archiveOrKey === 'string') { + key = archiveOrKey + } else if (Buffer.isBuffer(archiveOrKey)) { + key = datEncoding.toStr(archiveOrKey) + } else { + key = datEncoding.toStr(archiveOrKey.key) + } return path.join(datPath, 'Archives', 'Meta', key.slice(0, 2), key.slice(2)) } -// get the path to an archive's temporary local sync path +/** + * @description Get the path to an archive's temporary local sync path. + * @param {string | Buffer | InternalDatArchive} archiveOrKey + * @returns {string} + */ const getInternalLocalSyncPath = exports.getInternalLocalSyncPath = function (archiveOrKey) { - var key = datEncoding.toStr(archiveOrKey.key || archiveOrKey) + var key /** @type string */ + if (typeof archiveOrKey === 'string') { + key = archiveOrKey + } else if (Buffer.isBuffer(archiveOrKey)) { + key = datEncoding.toStr(archiveOrKey) + } else { + key = datEncoding.toStr(archiveOrKey.key) + } return path.join(datPath, 'Archives', 'LocalCopy', key.slice(0, 2), key.slice(2)) } -// delete all db entries and files for an archive +/** + * @description Delete all db entries and files for an archive. + * @param {string} key + * @returns {Promise} + */ exports.deleteArchive = async function (key) { const path = getArchiveMetaPath(key) const info = await jetpack.inspectTreeAsync(path) @@ -64,40 +154,42 @@ exports.removeListener = events.removeListener.bind(events) // exported methods: archive user settings // = -// get an array of saved archives -// - optional `query` keys: -// - `isSaved`: bool -// - `isNetworked`: bool -// - `isOwner`: bool, does beaker have the secret key? 
-// - `type`: string, a type filter -// - `showHidden`: bool, show hidden dats -// - `key`: string, the key of the archive you want (return single result) -exports.query = async function (profileId, query) { - query = query || {} - +/** + * @description Get an array of saved archives. + * @param {number} profileId + * @param {Object} [query] + * @param {string} [query.key] + * @param {boolean} [query.isSaved] + * @param {boolean} [query.isNetworked] + * @param {boolean} [query.isOwner] + * @param {boolean} [query.showHidden] + * @param {string} [query.type] + * @param {string} [query.string] + * @returns {Promise>} + */ +exports.query = async function (profileId, query = {}) { // fetch archive meta var values = [] - var WHERE = [] - if (query.isOwner === true) WHERE.push('archives_meta.isOwner = 1') - if (query.isOwner === false) WHERE.push('archives_meta.isOwner = 0') - if (query.isNetworked === true) WHERE.push('archives.networked = 1') - if (query.isNetworked === false) WHERE.push('archives.networked = 0') + var whereList = [] + if (query.isOwner === true) whereList.push('archives_meta.isOwner = 1') + if (query.isOwner === false) whereList.push('archives_meta.isOwner = 0') + if (query.isNetworked === true) whereList.push('archives.networked = 1') + if (query.isNetworked === false) whereList.push('archives.networked = 0') if ('isSaved' in query) { if (query.isSaved) { - WHERE.push('archives.profileId = ?') + whereList.push('archives.profileId = ?') values.push(profileId) - WHERE.push('archives.isSaved = 1') + whereList.push('archives.isSaved = 1') } else { - WHERE.push('(archives.isSaved = 0 OR archives.isSaved IS NULL)') + whereList.push('(archives.isSaved = 0 OR archives.isSaved IS NULL)') } } - if ('key' in query) { - WHERE.push('archives_meta.key = ?') + if (typeof query.key !== 'undefined') { + whereList.push('archives_meta.key = ?') values.push(query.key) } - if (!query.showHidden) WHERE.push('(archives.hidden = 0 OR archives.hidden IS NULL)') - if (WHERE.length) WHERE = `WHERE ${WHERE.join(' AND ')}` - else WHERE = '' + if (!query.showHidden) whereList.push('(archives.hidden = 0 OR archives.hidden IS NULL)') + var WHERE = whereList.length ? `WHERE ${whereList.join(' AND ')}` : '' var archives = await db.all(` SELECT @@ -156,7 +248,7 @@ exports.query = async function (profileId, query) { // apply manual filters if ('type' in query) { let types = Array.isArray(query.type) ? query.type : [query.type] - archives = archives.filter(a => { + archives = archives.filter((/** @type LibraryArchiveRecord */ a) => { for (let type of types) { if (a.type.indexOf(type) === -1) { return false @@ -169,7 +261,10 @@ exports.query = async function (profileId, query) { return ('key' in query) ? archives[0] : archives } -// get all archives that should be unsaved +/** + * @description Get all archives that should be unsaved. + * @returns {Promise>} + */ exports.listExpiredArchives = async function () { return db.all(` SELECT archives.key @@ -182,10 +277,16 @@ exports.listExpiredArchives = async function () { `, [Date.now()]) } -// get all archives that are ready for garbage collection +/** + * @description Get all archives that are ready for garbage collection. + * @param {Object} [opts] + * @param {number} [opts.olderThan] + * @param {boolean} [opts.isOwner] + * @returns {Promise>} + */ exports.listGarbageCollectableArchives = async function ({olderThan, isOwner} = {}) { olderThan = typeof olderThan === 'number' ? olderThan : DAT_GC_EXPIRATION_AGE - isOwner = typeof isOwner === 'boolean' ? 
`AND archives_meta.isOwner = ${isOwner ? '1' : '0'}` : '' + var isOwnerClause = typeof isOwner === 'boolean' ? `AND archives_meta.isOwner = ${isOwner ? '1' : '0'}` : '' // fetch archives var records = await db.all(` @@ -195,7 +296,7 @@ exports.listGarbageCollectableArchives = async function ({olderThan, isOwner} = WHERE (archives.isSaved != 1 OR archives.isSaved IS NULL) AND archives_meta.lastAccessTime < ? - ${isOwner} + ${isOwnerClause} `, [Date.now() - olderThan]) var records2 = records.slice() @@ -208,7 +309,13 @@ exports.listGarbageCollectableArchives = async function ({olderThan, isOwner} = return records } -// upsert the last-access time +/** + * @description Upsert the last-access time. + * @param {string | Buffer} key + * @param {string} [timeVar] + * @param {number} [value] + * @returns {Promise} + */ exports.touch = async function (key, timeVar = 'lastAccessTime', value = -1) { var release = await lock('archives-db:meta') try { @@ -216,22 +323,28 @@ exports.touch = async function (key, timeVar = 'lastAccessTime', value = -1) { timeVar = 'lastAccessTime' } if (value === -1) value = Date.now() - key = datEncoding.toStr(key) - await db.run(`UPDATE archives_meta SET ${timeVar}=? WHERE key=?`, [value, key]) - await db.run(`INSERT OR IGNORE INTO archives_meta (key, ${timeVar}) VALUES (?, ?)`, [key, value]) + var keyStr = datEncoding.toStr(key) + await db.run(`UPDATE archives_meta SET ${timeVar}=? WHERE key=?`, [value, keyStr]) + await db.run(`INSERT OR IGNORE INTO archives_meta (key, ${timeVar}) VALUES (?, ?)`, [keyStr, value]) } finally { release() } } -// get a single archive's user settings -// - supresses a not-found with an empty object +/** + * @description + * Get a single archive's user settings. + * (Returns an empty object on not found.) + * @param {number} profileId + * @param {string | Buffer} key + * @returns {Promise} + */ const getUserSettings = exports.getUserSettings = async function (profileId, key) { // massage inputs - key = typeof key !== 'string' ? datEncoding.toStr(key) : key + var keyStr = typeof key !== 'string' ? datEncoding.toStr(key) : key // validate inputs - if (!DAT_HASH_REGEX.test(key)) { + if (!DAT_HASH_REGEX.test(keyStr)) { throw new InvalidArchiveKeyError() } @@ -239,39 +352,53 @@ const getUserSettings = exports.getUserSettings = async function (profileId, key try { var settings = await db.get(` SELECT * FROM archives WHERE profileId = ? AND key = ? - `, [profileId, key]) + `, [profileId, keyStr]) settings.isSaved = !!settings.isSaved settings.hidden = !!settings.hidden settings.networked = !!settings.networked settings.autoDownload = !!settings.autoDownload settings.autoUpload = !!settings.autoUpload - settings.previewMode = settings.previewMode == 1 - return settings + settings.previewMode = Number(settings.previewMode) === 1 + return /** @type LibraryArchiveUserSettings */(settings) } catch (e) { - return {} + return /** @type LibraryArchiveUserSettings */({}) } } -// write an archive's user setting +/** + * @description Write an archive's user setting. 
+ * @param {number} profileId + * @param {string | Buffer} key + * @param {Object} [newValues] + * @param {boolean} [newValues.isSaved] + * @param {boolean} [newValues.hidden] + * @param {boolean} [newValues.networked] + * @param {boolean} [newValues.autoDownload] + * @param {boolean} [newValues.autoUpload] + * @param {number} [newValues.expiresAt] + * @param {string} [newValues.localSyncPath] + * @param {boolean} [newValues.previewMode] + * @returns {Promise} + */ exports.setUserSettings = async function (profileId, key, newValues = {}) { // massage inputs - key = datEncoding.toStr(key) + var keyStr = datEncoding.toStr(key) // validate inputs - if (!DAT_HASH_REGEX.test(key)) { + if (!DAT_HASH_REGEX.test(keyStr)) { throw new InvalidArchiveKeyError() } var release = await lock('archives-db') try { // fetch current - var value = await getUserSettings(profileId, key) + var value = await getUserSettings(profileId, keyStr) if (!value || typeof value.key === 'undefined') { // create - value = { + value = /** @type LibraryArchiveUserSettings */ ({ profileId, - key, + key: keyStr, isSaved: newValues.isSaved, hidden: newValues.hidden, networked: ('networked' in newValues) ? newValues.networked : true, @@ -280,10 +407,10 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { expiresAt: newValues.expiresAt, localSyncPath: (newValues.localSyncPath) ? newValues.localSyncPath : '', previewMode: ('previewMode' in newValues) ? newValues.previewMode : '' - } + }) let valueArray = [ profileId, - key, + keyStr, flag(value.isSaved), flag(value.hidden), flag(value.networked), @@ -330,7 +457,7 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { value.localSyncPath, flag(value.previewMode), profileId, - key + keyStr ] await db.run(` UPDATE archives @@ -348,7 +475,7 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { `, valueArray) } - events.emit('update:archive-user-settings', key, value, newValues) + events.emit('update:archive-user-settings', keyStr, value, newValues) return value } finally { release() @@ -358,14 +485,19 @@ exports.setUserSettings = async function (profileId, key, newValues = {}) { // exported methods: archive meta // = -// get a single archive's metadata -// - supresses a not-found with an empty object +/** + * @description + * Get a single archive's metadata. + * Returns an empty object on not-found. + * @param {string | Buffer} key + * @returns {Promise} + */ const getMeta = exports.getMeta = async function (key) { // massage inputs - key = typeof key !== 'string' ? datEncoding.toStr(key) : key + var keyStr = typeof key !== 'string' ? datEncoding.toStr(key) : key // validate inputs - if (!DAT_HASH_REGEX.test(key)) { + if (!DAT_HASH_REGEX.test(keyStr)) { throw new InvalidArchiveKeyError() } @@ -380,9 +512,9 @@ const getMeta = exports.getMeta = async function (key) { LEFT JOIN apps ON apps.url = ('dat://' || archives_meta.key) WHERE archives_meta.key = ? GROUP BY archives_meta.key - `, [key]) + `, [keyStr]) if (!meta) { - return defaultMeta(key) + return defaultMeta(keyStr) } // massage some values @@ -401,15 +533,23 @@ const getMeta = exports.getMeta = async function (key) { return meta } -// write an archive's metadata -exports.setMeta = async function (key, value = {}) { +/** + * @description Write an archive's metadata. 
+ * @param {string | Buffer} key + * @param {LibraryArchiveMeta} [value] + * @returns {Promise} + */ +exports.setMeta = async function (key, value) { // massage inputs - key = datEncoding.toStr(key) + var keyStr = datEncoding.toStr(key) // validate inputs - if (!DAT_HASH_REGEX.test(key)) { + if (!DAT_HASH_REGEX.test(keyStr)) { throw new InvalidArchiveKeyError() } + if (!value || typeof value !== 'object') { + return // dont bother + } // extract the desired values var {title, description, type, size, mtime, isOwner} = value @@ -417,30 +557,35 @@ exports.setMeta = async function (key, value = {}) { description = typeof description === 'string' ? description : '' if (typeof type === 'string') type = type.split(' ') else if (Array.isArray(type)) type = type.filter(v => v && typeof v === 'string') - isOwner = flag(isOwner) + var isOwnerFlag = flag(isOwner) // write var release = await lock('archives-db:meta') - var {lastAccessTime, lastLibraryAccessTime} = await getMeta(key) + var {lastAccessTime, lastLibraryAccessTime} = await getMeta(keyStr) try { await db.run(` INSERT OR REPLACE INTO archives_meta (key, title, description, mtime, size, isOwner, lastAccessTime, lastLibraryAccessTime) VALUES (?, ?, ?, ?, ?, ?, ?, ?) - `, [key, title, description, mtime, size, isOwner, lastAccessTime, lastLibraryAccessTime]) - await db.run(`DELETE FROM archives_meta_type WHERE key=?`, key) + `, [keyStr, title, description, mtime, size, isOwnerFlag, lastAccessTime, lastLibraryAccessTime]) + await db.run(`DELETE FROM archives_meta_type WHERE key=?`, keyStr) if (type) { await Promise.all(type.map(t => ( - db.run(`INSERT INTO archives_meta_type (key, type) VALUES (?, ?)`, [key, t]) + db.run(`INSERT INTO archives_meta_type (key, type) VALUES (?, ?)`, [keyStr, t]) ))) } } finally { release() } - events.emit('update:archive-meta', key, value) + events.emit('update:archive-meta', keyStr, value) } -// find the archive currently using a given localSyncPath +/** + * @description Find the archive currently using a given localSyncPath. + * @param {number} profileId + * @param {string} localSyncPath + * @returns {Promise} + */ exports.getByLocalSyncPath = async function (profileId, localSyncPath) { try { return await db.get(` @@ -454,24 +599,37 @@ exports.getByLocalSyncPath = async function (profileId, localSyncPath) { // internal methods // = +/** + * @param {string} key + * @returns {LibraryArchiveMeta} + */ function defaultMeta (key) { return { key, title: null, description: null, type: [], - author: null, mtime: 0, isOwner: false, lastAccessTime: 0, - installedNames: [] + lastLibraryAccessTime: 0, + installedNames: [], + size: 0 } } +/** + * @param {boolean} b + * @returns {number} + */ function flag (b) { return b ? 
1 : 0 } +/** + * @param {string} originURL + * @returns {string} + */ exports.extractOrigin = function (originURL) { var urlp = url.parse(originURL) if (!urlp || !urlp.host || !urlp.protocol) return diff --git a/dbs/bookmarks.js b/dbs/bookmarks.js index da53524d..62081f2b 100644 --- a/dbs/bookmarks.js +++ b/dbs/bookmarks.js @@ -5,15 +5,41 @@ const lock = require('../lib/lock') const NORMALIZE_OPTS = { stripFragment: false, stripWWW: false, - removeQueryParameters: false, removeTrailingSlash: false } +// typedefs +// = + +/** + * @typedef {Object} Bookmark + * @prop {boolean} _origin + * @prop {boolean} _url + * @prop {boolean} private + * @prop {number} createdAt + * @prop {string} href + * @prop {string} title + * @prop {string[]} tags + * @prop {string} notes + * @prop {boolean} pinned + * @prop {number} pinOrder + */ + // exported methods // = +/** + * @param {number} profileId + * @param {string} url + * @param {Object} values + * @param {string} values.title + * @param {string | string[]} values.tags + * @param {string} values.notes + * @param {number} values.pinOrder + * @returns {Promise} + */ exports.bookmark = async function (profileId, url, {title, tags, notes, pinOrder}) { - tags = tagsToString(tags) + var tagsStr = tagsToString(tags) var release = await lock(`bookmark:${url}`) try { // read old bookmark and fallback to old values as needed @@ -21,7 +47,7 @@ exports.bookmark = async function (profileId, url, {title, tags, notes, pinOrder oldBookmark = oldBookmark || {} const pinned = oldBookmark.pinned ? 1 : 0 title = typeof title === 'undefined' ? oldBookmark.title : title - tags = typeof tags === 'undefined' ? oldBookmark.tags : tags + tagsStr = typeof tagsStr === 'undefined' ? oldBookmark.tags : tagsStr notes = typeof notes === 'undefined' ? oldBookmark.notes : notes pinOrder = typeof pinOrder === 'undefined' ? oldBookmark.pinOrder : pinOrder @@ -30,20 +56,36 @@ exports.bookmark = async function (profileId, url, {title, tags, notes, pinOrder INSERT OR REPLACE INTO bookmarks (profileId, url, title, tags, notes, pinned, pinOrder) VALUES (?, ?, ?, ?, ?, ?, ?) - `, [profileId, url, title, tags, notes, pinned, pinOrder]) + `, [profileId, url, title, tagsStr, notes, pinned, pinOrder]) } finally { release() } } +/** + * @param {number} profileId + * @param {string} url + * @returns {Promise} + */ exports.unbookmark = function (profileId, url) { return db.run(`DELETE FROM bookmarks WHERE profileId = ? AND url = ?`, [profileId, url]) } +/** + * @param {number} profileId + * @param {string} url + * @param {boolean} pinned + * @returns {Promise} + */ exports.setBookmarkPinned = function (profileId, url, pinned) { return db.run(`UPDATE bookmarks SET pinned = ? WHERE profileId = ? AND url = ?`, [pinned ? 1 : 0, profileId, url]) } +/** + * @param {number} profileId + * @param {string[]} urls + * @returns {Promise} + */ exports.setBookmarkPinOrder = async function (profileId, urls) { var len = urls.length await Promise.all(urls.map((url, i) => ( @@ -51,10 +93,21 @@ exports.setBookmarkPinOrder = async function (profileId, urls) { ))) } +/** + * @param {number} profileId + * @param {string} url + * @returns {Promise} + */ exports.getBookmark = async function (profileId, url) { return toNewFormat(await db.get(`SELECT url, title, tags, notes, pinned, pinOrder, createdAt FROM bookmarks WHERE profileId = ? 
AND url = ?`, [profileId, url])) } +/** + * @param {number} profileId + * @param {Object} [opts] + * @param {string} [opts.tag] + * @returns {Promise>} + */ exports.listBookmarks = async function (profileId, {tag} = {}) { var bookmarks = await db.all(`SELECT url, title, tags, notes, pinned, pinOrder, createdAt FROM bookmarks WHERE profileId = ? ORDER BY createdAt DESC`, [profileId]) bookmarks = bookmarks.map(toNewFormat) @@ -73,11 +126,19 @@ exports.listBookmarks = async function (profileId, {tag} = {}) { return bookmarks } +/** + * @param {number} profileId + * @returns {Promise>} + */ exports.listPinnedBookmarks = async function (profileId) { var bookmarks = await db.all(`SELECT url, title, tags, notes, pinned, pinOrder, createdAt FROM bookmarks WHERE profileId = ? AND pinned = 1 ORDER BY pinOrder DESC`, [profileId]) return bookmarks.map(toNewFormat) } +/** + * @param {number} profileId + * @returns {Promise>} + */ exports.listBookmarkTags = async function (profileId) { var tagSet = new Set() var bookmarks = await db.all(`SELECT tags FROM bookmarks WHERE profileId = ?`, [profileId]) @@ -89,10 +150,14 @@ exports.listBookmarkTags = async function (profileId) { return Array.from(tagSet) } -// TEMP -// apply normalization to old bookmarks -// (can probably remove this in 2018 or so) -// -prf +/** + * @description + * TEMP + * apply normalization to old bookmarks + * (can probably remove this in 2018 or so) + * -prf + * @returns {Promise} + */ exports.fixOldBookmarks = async function () { var bookmarks = await db.all(`SELECT url FROM bookmarks`) bookmarks.forEach(b => { @@ -101,6 +166,10 @@ exports.fixOldBookmarks = async function () { }) } +/** + * @param {string | string[]} v + * @returns {string} + */ function tagsToString (v) { if (Array.isArray(v)) { v = v.join(' ') @@ -108,8 +177,12 @@ function tagsToString (v) { return v } +/** + * @param {Object} b + * @returns {Bookmark | null} + */ function toNewFormat (b) { - if (!b) return b + if (!b) return null return { _origin: false, _url: false, diff --git a/dbs/history.js b/dbs/history.js index 7c17d457..aa2ed62a 100644 --- a/dbs/history.js +++ b/dbs/history.js @@ -1,7 +1,13 @@ const lock = require('../lib/lock') const db = require('./profile-data-db') +// typedefs +// = + class BadParamError extends Error { + /** + * @param {string} msg + */ constructor (msg) { super() this.name = 'BadParamError' @@ -9,9 +15,30 @@ class BadParamError extends Error { } } +/** + * @typedef {Object} Visit + * @prop {number} profileId + * @prop {string} url + * @prop {string} title + * @prop {number} ts + * + * @typedef {Object} VisitSearchResult + * @prop {string} offsets + * @prop {string} url + * @prop {string} title + * @prop {number} num_visits + */ + // exported methods // = +/** + * @param {number} profileId + * @param {Object} values + * @param {string} values.url + * @param {string} values.title + * @returns {Promise} + */ exports.addVisit = async function (profileId, {url, title}) { // validate parameters if (!url || typeof url !== 'string') { @@ -54,14 +81,24 @@ exports.addVisit = async function (profileId, {url, title}) { } } +/** + * @param {number} profileId + * @param {Object} opts + * @param {string} [opts.search] + * @param {number} [opts.offset] + * @param {number} [opts.limit] + * @param {number} [opts.before] + * @param {number} [opts.after] + * @returns {Promise>} + */ exports.getVisitHistory = async function (profileId, {search, offset, limit, before, after}) { var release = await lock('history-db') try { - const params = [ + const params 
= /** @type Array */([ profileId, limit || 50, offset || 0 - ] + ]) if (search) { // prep search terms params.push( @@ -102,6 +139,13 @@ exports.getVisitHistory = async function (profileId, {search, offset, limit, bef } } +/** + * @param {number} profileId + * @param {Object} opts + * @param {number} [opts.offset] + * @param {number} [opts.limit] + * @returns {Promise>} + */ exports.getMostVisited = async function (profileId, { offset, limit }) { var release = await lock('history-db') try { @@ -121,6 +165,10 @@ exports.getMostVisited = async function (profileId, { offset, limit }) { } } +/** + * @param {string} q + * @returns {Promise>} + */ exports.search = async function (q) { if (!q || typeof q !== 'string') { throw new BadParamError('q must be a string') @@ -148,6 +196,10 @@ exports.search = async function (q) { } } +/** + * @param {string} url + * @returns {Promise} + */ exports.removeVisit = async function (url) { // validate parameters if (!url || typeof url !== 'string') { @@ -168,6 +220,10 @@ exports.removeVisit = async function (url) { } } +/** + * @param {number} timestamp + * @returns {Promise} + */ exports.removeVisitsAfter = async function (timestamp) { var release = await lock('history-db') try { @@ -182,6 +238,9 @@ exports.removeVisitsAfter = async function (timestamp) { } } +/** + * @returns {Promise} + */ exports.removeAllVisits = async function () { var release = await lock('history-db') db.run('DELETE FROM visits;') diff --git a/dbs/profile-data-db.js b/dbs/profile-data-db.js index a4c919b4..b310a93f 100644 --- a/dbs/profile-data-db.js +++ b/dbs/profile-data-db.js @@ -14,6 +14,10 @@ var setupPromise // exported methods // = +/** + * @param {Object} opts + * @param {string} opts.userDataPath + */ exports.setup = function (opts) { // open database var dbPath = path.join(opts.userDataPath, 'Profiles') @@ -21,16 +25,28 @@ exports.setup = function (opts) { setupPromise = setupSqliteDB(db, {setup: setupDb, migrations}, '[PROFILES]') } +/** + * @param {...(string | number | boolean | Array)} args + * @return {Promise} + */ exports.get = async function (...args) { await setupPromise return cbPromise(cb => db.get(...args, cb)) } +/** + * @param {...(string | number | boolean | Array)} args + * @return {Promise>} + */ exports.all = async function (...args) { await setupPromise return cbPromise(cb => db.all(...args, cb)) } +/** + * @param {...(string | number | boolean | Array)} args + * @return {Promise} + */ exports.run = async function (...args) { await setupPromise return cbPromise(cb => db.run(...args, function (err) { @@ -39,10 +55,16 @@ exports.run = async function (...args) { })) } +/** + * @returns {Promise} + */ exports.serialize = function () { return db.serialize() } +/** + * @returns {Promise} + */ exports.parallelize = function () { return db.parallelize() } diff --git a/dbs/settings.js b/dbs/settings.js index e2fafe4b..0a9ce06d 100644 --- a/dbs/settings.js +++ b/dbs/settings.js @@ -16,6 +16,11 @@ var events = new EventEmitter() // exported methods // = +/** + * @param {Object} opts + * @param {string} opts.userDataPath + * @param {string} opts.homePath + */ exports.setup = function (opts) { // open database var dbPath = path.join(opts.userDataPath, 'Settings') @@ -38,10 +43,15 @@ exports.setup = function (opts) { exports.on = events.on.bind(events) exports.once = events.once.bind(events) +/** + * @param {string} key + * @param {string | number} value + * @returns {Promise} + */ exports.set = function (key, value) { events.emit('set', key, value) events.emit('set:' + 
key, value) - return setupPromise.then(v => cbPromise(cb => { + return setupPromise.then(() => cbPromise(cb => { db.run(` INSERT OR REPLACE INTO settings (key, value, ts) @@ -50,13 +60,17 @@ exports.set = function (key, value) { })) } +/** + * @param {string} key + * @returns {boolean | Promise} + */ exports.get = function (key) { // env variables if (key === 'no_welcome_tab') { - return (getEnvVar('BEAKER_NO_WELCOME_TAB') == 1) + return (Number(getEnvVar('BEAKER_NO_WELCOME_TAB')) === 1) } // stored values - return setupPromise.then(v => cbPromise(cb => { + return setupPromise.then(() => cbPromise(cb => { db.get(`SELECT value FROM settings WHERE key = ?`, [key], (err, row) => { if (row) { row = row.value } if (typeof row === 'undefined') { row = defaultSettings[key] } @@ -65,6 +79,9 @@ exports.get = function (key) { })) } +/** + * @returns {Promise} + */ exports.getAll = function () { return setupPromise.then(v => cbPromise(cb => { db.all(`SELECT key, value FROM settings`, (err, rows) => { @@ -73,7 +90,7 @@ exports.getAll = function () { var obj = {} rows.forEach(row => { obj[row.key] = row.value }) obj = Object.assign({}, defaultSettings, obj) - obj.no_welcome_tab = (getEnvVar('BEAKER_NO_WELCOME_TAB') == 1) + obj.no_welcome_tab = (Number(getEnvVar('BEAKER_NO_WELCOME_TAB')) === 1) cb(null, obj) }) })) diff --git a/dbs/sitedata.js b/dbs/sitedata.js index 9fcfe436..b2c181e1 100644 --- a/dbs/sitedata.js +++ b/dbs/sitedata.js @@ -8,6 +8,7 @@ const datLibrary = require('../dat/library') // globals // = + var db var migrations var setupPromise @@ -15,6 +16,10 @@ var setupPromise // exported methods // = +/** + * @param {Object} opts + * @param {string} opts.userDataPath + */ exports.setup = function (opts) { // open database var dbPath = path.join(opts.userDataPath, 'SiteData') @@ -22,6 +27,14 @@ exports.setup = function (opts) { setupPromise = setupSqliteDB(db, {migrations}, '[SITEDATA]') } +/** + * @param {string} url + * @param {string} key + * @param {number | string} value + * @param {Object} [opts] + * @param {boolean} [opts.dontExtractOrigin] + * @returns {Promise} + */ const set = exports.set = async function (url, key, value, opts) { await setupPromise var origin = opts && opts.dontExtractOrigin ? url : await extractOrigin(url) @@ -35,6 +48,11 @@ const set = exports.set = async function (url, key, value, opts) { }) } +/** + * @param {string} url + * @param {string} key + * @returns {Promise} + */ const clear = exports.clear = async function (url, key) { await setupPromise var origin = await extractOrigin(url) @@ -46,6 +64,13 @@ const clear = exports.clear = async function (url, key) { }) } +/** + * @param {string} url + * @param {string} key + * @param {Object} [opts] + * @param {boolean} [opts.dontExtractOrigin] + * @returns {Promise} + */ const get = exports.get = async function (url, key, opts) { await setupPromise var origin = opts && opts.dontExtractOrigin ? 
url : await extractOrigin(url) @@ -58,6 +83,10 @@ const get = exports.get = async function (url, key, opts) { }) } +/** + * @param {string} url + * @returns {Promise} + */ const getPermissions = exports.getPermissions = async function (url) { await setupPromise var origin = await extractOrigin(url) @@ -75,6 +104,10 @@ const getPermissions = exports.getPermissions = async function (url) { }) } +/** + * @param {string} url + * @returns {Promise>} + */ exports.getNetworkPermissions = async function (url) { await setupPromise var origin = await extractOrigin(url) @@ -84,7 +117,7 @@ exports.getNetworkPermissions = async function (url) { if (err) return cb(err) // convert to array - var origins = [] + var origins = /** @type string[] */([]) if (rows) { rows.forEach(row => { if (row.value) origins.push(row.key.split(':').pop()) @@ -95,6 +128,10 @@ exports.getNetworkPermissions = async function (url) { }) } +/** + * @param {string} url + * @returns {Promise} + */ const getAppPermissions = exports.getAppPermissions = async function (url) { await setupPromise var origin = await extractOrigin(url) @@ -117,15 +154,31 @@ const getAppPermissions = exports.getAppPermissions = async function (url) { }) } +/** + * @param {string} url + * @param {string} key + * @returns {Promise} + */ const getPermission = exports.getPermission = function (url, key) { return get(url, 'perm:' + key) } +/** + * @param {string} url + * @param {string} key + * @param {string | number} value + * @returns {Promise} + */ const setPermission = exports.setPermission = function (url, key, value) { value = value ? 1 : 0 return set(url, 'perm:' + key, value) } +/** + * @param {string} url + * @param {Object} appPerms + * @returns {Promise} + */ const setAppPermissions = exports.setAppPermissions = async function (url, appPerms) { await setupPromise var origin = await extractOrigin(url) @@ -150,10 +203,19 @@ const setAppPermissions = exports.setAppPermissions = async function (url, appPe } } +/** + * @param {string} url + * @param {string} key + * @returns {Promise} + */ const clearPermission = exports.clearPermission = function (url, key) { return clear(url, 'perm:' + key) } +/** + * @param {string} key + * @returns {Promise} + */ const clearPermissionAllOrigins = exports.clearPermissionAllOrigins = async function (key) { await setupPromise key = 'perm:' + key @@ -164,26 +226,6 @@ const clearPermissionAllOrigins = exports.clearPermissionAllOrigins = async func }) } -exports.query = async function (values) { - await setupPromise - - // massage query - if ('origin' in values) { - values.origin = await extractOrigin(values.origin) - } - - return cbPromise(cb => { - // run query - const keys = Object.keys(values) - const where = keys.map(k => `${k} = ?`).join(' AND ') - values = keys.map(k => values[k]) - db.all(`SELECT * FROM sitedata WHERE ${where}`, values, (err, res) => { - if (err) return cb(err) - cb(null, res && res.value) - }) - }) -} - exports.WEBAPI = { get, set, @@ -199,6 +241,10 @@ exports.WEBAPI = { // internal methods // = +/** + * @param {string} originURL + * @returns {Promise} + */ async function extractOrigin (originURL) { var urlp = url.parse(originURL) if (!urlp || !urlp.host || !urlp.protocol) return diff --git a/dbs/templates.js b/dbs/templates.js index 4be48c6c..61a9e387 100644 --- a/dbs/templates.js +++ b/dbs/templates.js @@ -1,20 +1,56 @@ const db = require('./profile-data-db') +// typedefs +// = + +/** + * @typedef {Object} Template + * @prop {string} url + * @prop {string} title + * @prop {number} createdAt + * 
+ * @typedef {Object} TemplateScreenshot + * @prop {string} url + * @prop {string} screenshot + */ + // exported api // = +/** + * @param {number} profileId + * @param {string} url + * @returns {Promise