Documentation ¶
Index ¶
- type Configuration
- type DBConfiguration
- type DuplicateDetectorConfiguration
- type FeedsFetchingConfiguration
- type GDELTFetchingConfiguration
- type LogLevel
- type RabbitMQConfiguration
- type TweetsFetchingConfiguration
- type VectorizerConfiguration
- type WebScrapingConfiguration
- type ZeroShotClassificationConfiguration
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type Configuration ¶
type Configuration struct { LogLevel LogLevel `yaml:"log_level"` DB DBConfiguration RabbitMQ RabbitMQConfiguration FeedsFetching FeedsFetchingConfiguration `yaml:"feeds_fetching"` GDELTFetching GDELTFetchingConfiguration `yaml:"gdelt_fetching"` TweetsFetching TweetsFetchingConfiguration `yaml:"tweets_fetching"` WebScraping WebScrapingConfiguration `yaml:"web_scraping"` DuplicateDetector DuplicateDetectorConfiguration `yaml:"duplicate_detector"` Vectorizer VectorizerConfiguration `yaml:"vectorizer"` ZeroShotClassification ZeroShotClassificationConfiguration `yaml:"zero_shot_classification"` SupportedLanguages []string `yaml:"supported_languages"` }
Configuration provides app-wide settings.
func FromYAMLFile ¶
func FromYAMLFile(filename string) (config Configuration, err error)
FromYAMLFile reads a Configuration object from a YAML file.
func (*Configuration) LanguageIsSupported ¶
func (c *Configuration) LanguageIsSupported(code string) bool
type DBConfiguration ¶
// DBConfiguration provides database-specific settings.
type DBConfiguration struct {
	// DSN declares no yaml tag. Presumably it is the data source name handed
	// to the database driver — confirm against the code that opens the
	// connection.
	DSN string
}
DBConfiguration provides database-specific settings.
type DuplicateDetectorConfiguration ¶
// DuplicateDetectorConfiguration holds the settings for near-duplicate web
// article detection. It is the type of Configuration.DuplicateDetector, which
// is tagged with the YAML key "duplicate_detector".
//
// NOTE(review): the Sub*/Pub* fields look like the queue name and routing keys
// the detector consumes from and publishes to, and TimeframeHours /
// SimilarityThreshold look like the comparison window and cut-off — confirm
// against the code that reads them.
type DuplicateDetectorConfiguration struct {
	TimeframeHours          int     `yaml:"timeframe_hours"`
	SimilarityThreshold     float32 `yaml:"similarity_threshold"`
	SubQueueName            string  `yaml:"sub_queue_name"`
	SubRoutingKey           string  `yaml:"sub_routing_key"`
	PubNewEventRoutingKey   string  `yaml:"pub_new_event_routing_key"`
	PubNewRelatedRoutingKey string  `yaml:"pub_new_related_routing_key"`
}
DuplicateDetectorConfiguration provides specific settings for detecting near-duplicate web articles.
type FeedsFetchingConfiguration ¶
// FeedsFetchingConfiguration holds the settings for the feeds-fetching
// operation. It is the type of Configuration.FeedsFetching, which is tagged
// with the YAML key "feeds_fetching".
//
// NOTE(review): OmitFeedItemsPublishedBeforeEnabled presumably gates whether
// OmitFeedItemsPublishedBefore is applied — confirm against the fetcher. How
// SleepingTime (a time.Duration) is written in YAML depends on the decoder in
// use, which is not visible here.
type FeedsFetchingConfiguration struct {
	NumWorkers                          int           `yaml:"num_workers"`
	MaxAllowedFailures                  int           `yaml:"max_allowed_failures"`
	SleepingTime                        time.Duration `yaml:"sleeping_time"`
	OmitFeedItemsPublishedBeforeEnabled bool          `yaml:"omit_feed_items_published_before_enabled"`
	OmitFeedItemsPublishedBefore        time.Time     `yaml:"omit_feed_items_published_before"`
	NewWebResourceRoutingKey            string        `yaml:"new_web_resource_routing_key"`
	NewFeedItemRoutingKey               string        `yaml:"new_feed_item_routing_key"`
}
FeedsFetchingConfiguration provides specific settings for the feeds-fetching operation.
type GDELTFetchingConfiguration ¶
// GDELTFetchingConfiguration holds the settings for the GDELT-fetching
// operation. It is the type of Configuration.GDELTFetching, which is tagged
// with the YAML key "gdelt_fetching".
//
// NOTE(review): TopLevelCameoEventCodeWhitelist presumably restricts which
// top-level CAMEO event codes are kept — confirm against the fetcher. How
// SleepingTime (a time.Duration) is written in YAML depends on the decoder in
// use, which is not visible here.
type GDELTFetchingConfiguration struct {
	SleepingTime                    time.Duration `yaml:"sleeping_time"`
	NewWebResourceRoutingKey        string        `yaml:"new_web_resource_routing_key"`
	NewGDELTEventRoutingKey         string        `yaml:"new_gdelt_event_routing_key"`
	TopLevelCameoEventCodeWhitelist []string      `yaml:"top_level_cameo_event_code_whitelist"`
}
GDELTFetchingConfiguration provides specific settings for the GDELT-fetching operation.
type LogLevel ¶
LogLevel is a redefinition of zerolog.Level which satisfies encoding.TextUnmarshaler.
func (*LogLevel) UnmarshalText ¶
UnmarshalText unmarshals the text to a LogLevel.
type RabbitMQConfiguration ¶
RabbitMQConfiguration provides RabbitMQ-specific settings.
type TweetsFetchingConfiguration ¶ added in v0.3.0
// TweetsFetchingConfiguration holds the settings for the tweets-fetching
// operation. It is the type of Configuration.TweetsFetching, which is tagged
// with the YAML key "tweets_fetching".
//
// NOTE(review): OmitTweetsPublishedBeforeEnabled presumably gates whether
// OmitTweetsPublishedBefore is applied — confirm against the fetcher. How
// SleepingTime (a time.Duration) is written in YAML depends on the decoder in
// use, which is not visible here.
type TweetsFetchingConfiguration struct {
	NumWorkers                       int           `yaml:"num_workers"`
	SleepingTime                     time.Duration `yaml:"sleeping_time"`
	OmitTweetsPublishedBeforeEnabled bool          `yaml:"omit_tweets_published_before_enabled"`
	OmitTweetsPublishedBefore        time.Time     `yaml:"omit_tweets_published_before"`
	NewWebResourceRoutingKey         string        `yaml:"new_web_resource_routing_key"`
	NewTweetRoutingKey               string        `yaml:"new_tweet_routing_key"`
	NewWebArticleRoutingKey          string        `yaml:"new_web_article_routing_key"`
}
TweetsFetchingConfiguration provides specific settings for the tweets-fetching operation.
type VectorizerConfiguration ¶
// VectorizerConfiguration holds the settings for the vectorization operation.
// It is the type of Configuration.Vectorizer, which is tagged with the YAML
// key "vectorizer".
//
// NOTE(review): LabseGrpcAddress and LabseTLSDisable presumably describe how
// to reach a LaBSE gRPC service and whether TLS is turned off for that
// connection — confirm against the client setup code.
type VectorizerConfiguration struct {
	NumWorkers                           int    `yaml:"num_workers"`
	SubQueueName                         string `yaml:"sub_queue_name"`
	SubNewWebArticleRoutingKey           string `yaml:"sub_new_web_article_routing_key"`
	PubNewVectorizedWebArticleRoutingKey string `yaml:"pub_new_vectorized_web_article_routing_key"`
	LabseGrpcAddress                     string `yaml:"labse_grpc_address"`
	LabseTLSDisable                      bool   `yaml:"labse_tls_disable"`
}
VectorizerConfiguration provides specific settings for the vectorization operation.
type WebScrapingConfiguration ¶
// WebScrapingConfiguration holds the settings for the Web Resource URLs
// scraping operation. It is the type of Configuration.WebScraping, which is
// tagged with the YAML key "web_scraping".
//
// NOTE(review): the Sub*/Pub* fields look like the queue name and routing keys
// the scraper consumes from and publishes to — confirm against the code that
// reads them.
type WebScrapingConfiguration struct {
	NumWorkers                  int    `yaml:"num_workers"`
	SubQueueName                string `yaml:"sub_queue_name"`
	SubNewWebResourceRoutingKey string `yaml:"sub_new_web_resource_routing_key"`
	PubNewWebArticleRoutingKey  string `yaml:"pub_new_web_article_routing_key"`
}
WebScrapingConfiguration provides specific settings for the Web Resource URLs scraping operation.
type ZeroShotClassificationConfiguration ¶
// ZeroShotClassificationConfiguration holds the settings for the spaGO
// zero-shot classification operation. It is the type of
// Configuration.ZeroShotClassification, which is tagged with the YAML key
// "zero_shot_classification".
//
// NOTE(review): ZeroShotGRPCAddress and GRPCTLSDisable presumably describe how
// to reach the classification gRPC service, while HypothesisTemplate,
// PossibleLabels and MultiClass look like the parameters of each
// classification request — confirm against the client code.
type ZeroShotClassificationConfiguration struct {
	NumWorkers          int      `yaml:"num_workers"`
	SubQueueName        string   `yaml:"sub_queue_name"`
	SubRoutingKey       string   `yaml:"sub_routing_key"`
	PubRoutingKey       string   `yaml:"pub_routing_key"`
	PayloadKey          string   `yaml:"payload_key"`
	ZeroShotGRPCAddress string   `yaml:"zero_shot_grpc_address"`
	GRPCTLSDisable      bool     `yaml:"grpc_tls_disable"`
	HypothesisTemplate  string   `yaml:"hypothesis_template"`
	PossibleLabels      []string `yaml:"possible_labels"`
	MultiClass          bool     `yaml:"multi_class"`
}
ZeroShotClassificationConfiguration provides specific settings for the spaGO zero-shot classification operation.