flodgatt/src/event/checked_event/status.rs

mod application;
mod attachment;
mod card;
mod poll;

use super::account::Account;
use super::emoji::Emoji;
use super::id::Id;
use super::mention::Mention;
use super::tag::Tag;
use super::visibility::Visibility;
use crate::request::Blocks;

use application::Application;
use attachment::Attachment;
use card::Card;
use poll::Poll;

use hashbrown::HashSet;
use serde::{Deserialize, Serialize};
use std::boxed::Box;
use std::string::String;
/// A Mastodon `Status` (toot). `deny_unknown_fields` makes deserialization fail if the
/// incoming JSON contains any field not listed here.
#[derive(Serialize, Deserialize, Debug, Clone, PartialEq)]
#[serde(deny_unknown_fields)]
pub struct Status {
    id: Id,
    uri: String,
    created_at: String,
    account: Account,
    content: String,
    visibility: Visibility,
    sensitive: bool,
    spoiler_text: String,
    media_attachments: Vec<Attachment>,
    application: Option<Application>, // Should be non-optional?
    mentions: Vec<Mention>,
    tags: Vec<Tag>,
    emojis: Vec<Emoji>,
    reblogs_count: i64,
    favourites_count: i64,
    replies_count: i64,
    url: Option<String>,
    in_reply_to_id: Option<Id>,
    in_reply_to_account_id: Option<Id>,
    reblog: Option<Box<Status>>,
    poll: Option<Poll>,
    card: Option<Card>,
    language: Option<String>,
    text: Option<String>,
    // ↓↓↓ Only for authorized users
    favourited: Option<bool>,
    reblogged: Option<bool>,
    muted: Option<bool>,
    bookmarked: Option<bool>,
    pinned: Option<bool>,
}

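// A minimal sketch of how a `Status` is typically obtained: the event payload is JSON,
// so it can be parsed with serde (the `serde_json` call and the `payload` string below
// are illustrative assumptions, not part of this file):
//
//     let status: Status = serde_json::from_str(payload)?;
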
impl Status {
    /// Returns `true` if the status should be filtered out based on its language.
    pub(crate) fn language_not(&self, allowed_langs: &HashSet<String>) -> bool {
        const ALLOW: bool = false;
        const REJECT: bool = true;

        let reject_and_maybe_log = |toot_language| {
            log::info!("Filtering out toot from `{}`", &self.account.acct);
            log::info!("Toot language: `{}`", toot_language);
            log::info!("Recipient's allowed languages: `{:?}`", allowed_langs);
            REJECT
        };
        if allowed_langs.is_empty() {
            return ALLOW; // listing no allowed_langs results in allowing all languages
        }

        match self.language.as_ref() {
            Some(toot_language) if allowed_langs.contains(toot_language) => ALLOW,
            None => ALLOW, // If toot language is unknown, toot is always allowed
            Some(empty) if empty.is_empty() => ALLOW, // An empty language tag is treated like an unknown one
            Some(toot_language) => reject_and_maybe_log(toot_language),
        }
    }
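
    // Illustrative behaviour of `language_not` (hypothetical values, not from the
    // original file): given `allowed_langs = {"en"}`, a toot with `language: Some("en")`
    // returns `false` (allowed), `Some("de")` returns `true` (filtered out), and
    // `None` or `Some("")` return `false` (always allowed). An empty `allowed_langs`
    // set allows every language.
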
    /// Returns `true` if the Status originated from a blocked domain, is from an account
    /// that has blocked the current user, or if the User's list of blocked/muted users
    /// includes a user involved in the Status.
    ///
    /// A user is involved in the Status/toot if they:
    /// * Are mentioned in this toot
    /// * Wrote this toot
    /// * Wrote a toot that this toot is replying to (if any)
    /// * Wrote the toot that this toot is boosting (if any)
    pub(crate) fn involves_any(&self, blocks: &Blocks) -> bool {
        const ALLOW: bool = false;
        const REJECT: bool = true;
        let Blocks {
            blocked_users,
            blocking_users,
            blocked_domains,
        } = blocks;
        let user_id = &Id(self.account.id.0);
        if blocking_users.contains(user_id) || self.involves(blocked_users) {
            REJECT
        } else {
            let full_username = &self.account.acct;
            match full_username.split('@').nth(1) {
                Some(originating_domain) if blocked_domains.contains(originating_domain) => REJECT,
                Some(_) | None => ALLOW, // None means the local instance, which can't be blocked
            }
        }
    }

    fn involves(&self, blocked_users: &HashSet<Id>) -> bool {
        // involved_users = mentioned_users + author + replied-to user + boosted user
        let mut involved_users: HashSet<Id> = self
            .mentions
            .iter()
            .map(|mention| Id(mention.id.0))
            .collect();
        // author
        involved_users.insert(Id(self.account.id.0));
        // replied-to user
        if let Some(user_id) = &self.in_reply_to_account_id {
            involved_users.insert(Id(user_id.0));
        }
        // boosted user
        if let Some(boosted_status) = &self.reblog {
            involved_users.insert(Id(boosted_status.account.id.0));
        }
        !involved_users.is_disjoint(blocked_users)
    }
}
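
// A minimal, self-contained sketch (illustrative values only, not taken from this crate's
// tests) of two pieces of logic used by `involves_any` and `involves` above: extracting
// the originating domain from an `acct` string with `split('@').nth(1)`, and checking
// overlap between two user sets with `is_disjoint`. It deliberately avoids constructing
// a full `Status`, since that would require every field above.
#[cfg(test)]
mod logic_sketch {
    use hashbrown::HashSet;

    #[test]
    fn domain_extraction() {
        // Remote accounts look like `user@example.com`; the part after the first `@`
        // is the originating domain.
        assert_eq!("user@example.com".split('@').nth(1), Some("example.com"));
        // Local accounts have no `@`, so there is no domain to block.
        assert_eq!("local_user".split('@').nth(1), None);
    }

    #[test]
    fn blocked_user_overlap() {
        // `involves` rejects a toot when the involved users and the blocked users
        // are *not* disjoint.
        let involved: HashSet<u64> = [1, 2, 3].iter().copied().collect();
        let blocked: HashSet<u64> = [3, 99].iter().copied().collect();
        assert!(!involved.is_disjoint(&blocked)); // user 3 overlaps, so the toot is rejected
    }
}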