Merge pull request #7 from interfect/revanced-compat

Make compatible with ReVanced
This commit is contained in:
Kavin 2022-10-30 18:51:46 +00:00 committed by GitHub
commit 7053e0bb14
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
6 changed files with 174 additions and 55 deletions

View file

@ -13,3 +13,41 @@ It also uses [sb-mirror](https://github.com/mchangrh/sb-mirror) for mirroring th
Feel free to add your instance to this list by making a pull request. Feel free to add your instance to this list by making a pull request.
You can also configure Piped-Backend to use your mirror by changing the `SPONSORBLOCK_SERVERS` configuration value. You can also configure Piped-Backend to use your mirror by changing the `SPONSORBLOCK_SERVERS` configuration value.
## Compatibility
This implementation does not implement the full SponsorBlock server API. It supports hash-based queries to `/api/skipSegments/<hash>`, with optional `categories` parameter, and queries to `/api/skipSegments` with required `videoID` and optional `categories` parameters.
The browser extension works with only the hash-based query endpoint, but other clients, such as the one in ReVanced, require the video ID endpoint, and additionally query `/api/userInfo` and `/api/isUserVip`. Right now there are stub implementations for these. ReVanced had not yet been verified as compatible.
## Using with Docker Compose
To run the server under Docker Compose, run:
```
docker compose up
```
This starts the API server, a database, and a mirroring service to download the SponsorBlock data from the `sponsorblock.kavin.rocks` mirror and keep it up to date.
The API will be available on `http://localhost:8000`. For example, you can try `http://localhost:8000/api/skipSegments/aabf` or `http://localhost:8000/api/skipSegments?videoID=eQ_8F4nzyiw`. **It will take a few minutes at least for the database to download and import,** so these will not return data on the first run.
## Building
To make a local release build, use `cargo build --release`. This will produce a binary in `target/release/sponsorblock-mirror`.
To make a Docker container, you need to do a BuildKit Docker build, not a normal Docker build. Make sure you have `buildx` available in your Docker, and run:
```bash
docker buildx build --load -t 1337kavin/sponsorblock-mirror .
```
## Troubleshooting
* If the linker complains about a missing `-lpq`, make sure you have the PostgreSQL development libraries, which may be in a `libpq-dev` package or your distribution's equivalent.
* If Docker complains that `the --mount option requires BuildKit`, make sure you are building with `docker buildx build` and not `docker build`.
* To access the PostgreSQL database directly, you can `docker exec -ti postgres-sb-mirror bash -c 'psql $POSTGRES_DB $POSTGRES_USER'`.
* Requests for videos not in the database are forwarded to `https://sponsor.ajay.app/`, which may be down or malfunctioning. A response of the string `Internal Server Error` is likely to be from there, rather than from this application.

View file

@ -1,3 +1,5 @@
version: "3"
services: services:
sb-mirror: sb-mirror:
image: mchangrh/sb-mirror:latest image: mchangrh/sb-mirror:latest

View file

@ -0,0 +1 @@
DROP INDEX IF EXISTS "sponsor_video_id_idx";

View file

@ -0,0 +1 @@
CREATE INDEX sponsor_video_id_idx ON "sponsorTimes"("videoID");

View file

@ -14,7 +14,7 @@ use tokio::time::interval;
use structs::{Segment, Sponsor}; use structs::{Segment, Sponsor};
use crate::routes::skip_segments; use crate::routes::{skip_segments, skip_segments_by_id, fake_is_user_vip, fake_user_info};
mod models; mod models;
mod routes; mod routes;
@ -125,5 +125,5 @@ fn rocket() -> Rocket<Build> {
}) })
}) })
).attach(CORS) ).attach(CORS)
.mount("/", routes![skip_segments]) .mount("/", routes![skip_segments, skip_segments_by_id, fake_is_user_vip, fake_user_info])
} }

View file

@ -6,34 +6,115 @@ use rocket::response::content;
use crate::{Db, Segment, Sponsor}; use crate::{Db, Segment, Sponsor};
use crate::models::SponsorTime; use crate::models::SponsorTime;
use crate::schema::sponsorTimes::dsl::*; // We *must* use "videoID" as an argument name to get Rocket to let us access
// the query parameter by that name, but if videoID is already used we
// can't do that.
use crate::schema::sponsorTimes::dsl::{
sponsorTimes,
shadowHidden,
hidden,
votes,
category,
hashedVideoID,
videoID as column_videoID
};
// init regex to match hash/hex // init regexes to match hash/hex or video ID
lazy_static! { lazy_static! {
static ref RE: regex::Regex = regex::Regex::new(r"^[0-9a-f]{4}$").unwrap(); static ref HASH_RE: regex::Regex = regex::Regex::new(r"^[0-9a-f]{4}$").unwrap();
static ref ID_RE: regex::Regex = regex::Regex::new(r"^[a-zA-Z0-9_-]{6,11}$").unwrap();
} }
// Segments can be fetched either by full video ID, or by prefix of hashed
// video ID. Different clients make different queries. This represents either
// kind of constraint.
enum VideoName {
ByHashPrefix(String),
ByID(String),
}
#[get("/api/skipSegments/<hash>?<categories>")] #[get("/api/skipSegments/<hash>?<categories>")]
pub async fn skip_segments( pub async fn skip_segments(
hash: String, hash: String,
categories: Option<&str>, categories: Option<&str>,
db: Db, db: Db,
) -> content::RawJson<String> { ) -> content::RawJson<String> {
let hash = hash.to_lowercase(); let hash = hash.to_lowercase();
// Check if hash matches hex regex // Check if hash matches hex regex
if !RE.is_match(&hash) { if !HASH_RE.is_match(&hash) {
return content::RawJson("Hash prefix does not match format requirements.".to_string()); return content::RawJson("Hash prefix does not match format requirements.".to_string());
} }
let hc = hash.clone(); let sponsors = find_skip_segments(VideoName::ByHashPrefix(hash.clone()), categories, db).await;
if sponsors.is_empty() {
// Fall back to central Sponsorblock server
let resp = reqwest::get(format!(
"https://sponsor.ajay.app/api/skipSegments/{}?categories={}",
hash,
categories.unwrap_or("[\"sponsor\"]"),
))
.await
.unwrap()
.text()
.await
.unwrap();
return content::RawJson(resp);
}
return content::RawJson(serde_json::to_string(&sponsors).unwrap());
}
#[get("/api/skipSegments?<videoID>&<categories>")]
pub async fn skip_segments_by_id(
#[allow(non_snake_case)]
videoID: String,
categories: Option<&str>,
db: Db,
) -> content::RawJson<String> {
// Check if ID matches ID regex
if !ID_RE.is_match(&videoID) {
return content::RawJson("videoID does not match format requirements".to_string());
}
let sponsors = find_skip_segments(VideoName::ByID(videoID.clone()), categories, db).await;
if sponsors.is_empty() {
// Fall back to central Sponsorblock server
let resp = reqwest::get(format!(
"https://sponsor.ajay.app/api/skipSegments?videoID={}&categories={}",
videoID,
categories.unwrap_or("[\"sponsor\"]"),
))
.await
.unwrap()
.text()
.await
.unwrap();
return content::RawJson(resp);
}
// Doing a lookup by video ID should return only one Sponsor object with
// one list of segments. We need to return just the list of segments.
return content::RawJson(serde_json::to_string(&sponsors[0].segments).unwrap());
}
async fn find_skip_segments(
name: VideoName,
categories: Option<&str>,
db: Db,
) -> Vec<Sponsor> {
let cat: Vec<String> = serde_json::from_str(categories.unwrap_or("[\"sponsor\"]")).unwrap(); let cat: Vec<String> = serde_json::from_str(categories.unwrap_or("[\"sponsor\"]")).unwrap();
if cat.is_empty() { if cat.is_empty() {
return content::RawJson( return Vec::new();
"[]".to_string(),
);
} }
let results: Vec<SponsorTime> = db.run(move |conn| { let results: Vec<SponsorTime> = db.run(move |conn| {
@ -41,16 +122,18 @@ pub async fn skip_segments(
.filter(shadowHidden.eq(0)) .filter(shadowHidden.eq(0))
.filter(hidden.eq(0)) .filter(hidden.eq(0))
.filter(votes.ge(0)) .filter(votes.ge(0))
.filter(hashedVideoID.like(format!("{}%", hc))); .filter(category.eq_any(cat)); // We know cat isn't empty at this point
let queried = { let queried = match name {
if cat.is_empty() { VideoName::ByHashPrefix(hash_prefix) => {
base_filter base_filter
.filter(hashedVideoID.like(format!("{}%", hash_prefix)))
.get_results::<SponsorTime>(conn) .get_results::<SponsorTime>(conn)
.expect("Failed to query sponsor times") .expect("Failed to query sponsor times")
} else { }
VideoName::ByID(video_id) => {
base_filter base_filter
.filter(category.eq_any(cat)) .filter(column_videoID.eq(video_id))
.get_results::<SponsorTime>(conn) .get_results::<SponsorTime>(conn)
.expect("Failed to query sponsor times") .expect("Failed to query sponsor times")
} }
@ -71,17 +154,7 @@ pub async fn skip_segments(
}) })
}; };
let segment = Segment { let segment = build_segment(result);
uuid: result.uuid.clone(),
action_type: result.action_type.clone(),
category: result.category.clone(),
description: result.description.clone(),
locked: result.locked,
segment: vec![result.start_time, result.end_time],
user_id: result.user_id.clone(),
video_duration: result.video_duration,
votes: result.votes,
};
let hash = result.hashed_video_id.clone(); let hash = result.hashed_video_id.clone();
@ -113,23 +186,7 @@ pub async fn skip_segments(
sponsor.segments.sort_by(|a, b| a.partial_cmp(b).unwrap()); sponsor.segments.sort_by(|a, b| a.partial_cmp(b).unwrap());
} }
if !sponsors.is_empty() { return sponsors.into_values().collect();
let sponsors: Vec<&Sponsor> = sponsors.values().collect();
return content::RawJson(serde_json::to_string(&sponsors).unwrap());
}
let resp = reqwest::get(format!(
"https://sponsor.ajay.app/api/skipSegments/{}?categories={}",
hash,
categories.unwrap_or("[]"),
))
.await
.unwrap()
.text()
.await
.unwrap();
return content::RawJson(resp);
} }
fn similar_segments(segment: &Segment, hash: &str, segments: &Vec<SponsorTime>) -> Vec<Segment> { fn similar_segments(segment: &Segment, hash: &str, segments: &Vec<SponsorTime>) -> Vec<Segment> {
@ -147,17 +204,7 @@ fn similar_segments(segment: &Segment, hash: &str, segments: &Vec<SponsorTime>)
let is_similar = is_overlap(segment, &seg.category, &seg.action_type, seg.start_time, seg.end_time); let is_similar = is_overlap(segment, &seg.category, &seg.action_type, seg.start_time, seg.end_time);
if is_similar { if is_similar {
similar_segments.push(Segment { similar_segments.push(build_segment(seg));
uuid: seg.uuid.clone(),
action_type: seg.action_type.clone(),
category: seg.category.clone(),
description: seg.description.clone(),
locked: seg.locked,
segment: vec![seg.start_time, seg.end_time],
user_id: seg.user_id.clone(),
video_duration: seg.video_duration,
votes: seg.votes,
});
} }
} }
@ -198,3 +245,33 @@ fn best_segment(segments: &Vec<Segment>) -> Segment {
best_segment best_segment
} }
fn build_segment (sponsor_time: &SponsorTime) -> Segment {
Segment {
uuid: sponsor_time.uuid.clone(),
action_type: sponsor_time.action_type.clone(),
category: sponsor_time.category.clone(),
description: sponsor_time.description.clone(),
locked: sponsor_time.locked,
segment: vec![sponsor_time.start_time, sponsor_time.end_time],
user_id: sponsor_time.user_id.clone(),
video_duration: sponsor_time.video_duration,
votes: sponsor_time.votes,
}
}
// These additional routes are faked to protect ReVanced from seeing errors. We
// don't *need* to do this to support ReVanced, but it gets rid of the
// perpetual "Loading..." in the settings.
// This would take a userID
#[get("/api/isUserVIP")]
pub async fn fake_is_user_vip() -> content::RawJson<String> {
content::RawJson("{\"hashedUserID\": \"\", \"vip\": false}".to_string())
}
// This would take a userID and an optional list values
#[get("/api/userInfo")]
pub async fn fake_user_info() -> content::RawJson<String> {
content::RawJson("{\"userID\": \"\", \"userName\": \"\", \"minutesSaved\": 0, \"segmentCount\": 0, \"viewCount\": 0}".to_string())
}