Skip to content

Commit

Permalink
Merge pull request #33 from nlnwa/timeout
Browse files Browse the repository at this point in the history
Add option for setting timeout on crawlSeed request to Frontier
  • Loading branch information
maeb authored Oct 28, 2020
2 parents d38b8d6 + af9c582 commit ee3d429
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 2 deletions.
3 changes: 3 additions & 0 deletions protobuf/frontier/v1/frontier.proto
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import "commons/v1/resources.proto";
import "config/v1/resources.proto";
import "frontier/v1/resources.proto";
import "google/protobuf/empty.proto";
import "google/protobuf/timestamp.proto";

option go_package = "github.com/nlnwa/veidemann-api-go/frontier/v1;frontier";
option java_multiple_files = true;
Expand Down Expand Up @@ -38,6 +39,8 @@ message CrawlSeedRequest {
string job_execution_id = 1;
veidemann.api.config.v1.ConfigObject job = 5;
veidemann.api.config.v1.ConfigObject seed = 6;
// The time at which crawling of this seed should stop. If this value is absent, no timeout applies.
google.protobuf.Timestamp timeout = 7;
}

// The execution id for a seed crawl
Expand Down
2 changes: 0 additions & 2 deletions protobuf/frontier/v1/resources.proto
Original file line number Diff line number Diff line change
Expand Up @@ -72,8 +72,6 @@ message Cookie {
// CrawlHostGroup identifies a crawl host group, names the politeness config it
// is valid for, and carries its fetch scheduling state: the earliest next fetch
// time, a busy flag, and the number of queued URIs.
// NOTE(review): this message is shown inside a diff hunk that reports two
// deleted lines without marking which ones; confirm which fields still exist
// in the current schema before relying on them.
message CrawlHostGroup {
string id = 1; // SHA-1 hash of the URI or the crawlgroup config id
string politeness_id = 2; // The politeness config this group is valid for
google.protobuf.Timestamp next_fetch_time = 3; // The earliest time a URI from this group might be fetched
bool busy = 4; // True if the crawler is busy fetching a URI from this group
int64 queued_uri_count = 5; // The number of queued URIs belonging to this CrawlHostGroup
}

Expand Down

0 comments on commit ee3d429

Please sign in to comment.