merge: phase 12 resolve conflicts

This commit is contained in:
salvacybersec
2026-04-06 12:27:23 +03:00
12 changed files with 3107 additions and 0 deletions

View File

@@ -0,0 +1,147 @@
package sources
import (
"context"
"encoding/json"
"errors"
"fmt"
"net/http"
"net/url"
"strings"
"time"
"golang.org/x/time/rate"
"github.com/salvacybersec/keyhunter/pkg/providers"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// BinaryEdgeSource implements recon.ReconSource against the BinaryEdge
// internet data API. It iterates provider keyword queries and emits a Finding
// per result event.
//
// A missing API key disables the source without error.
type BinaryEdgeSource struct {
// APIKey is sent as the X-Key request header. When empty, Enabled reports
// false and Sweep returns nil without issuing any request.
APIKey string
// BaseURL overrides the API root. Sweep falls back to
// https://api.binaryedge.io when it is empty.
BaseURL string
// Registry is passed to BuildQueries and binaryedgeKeywordIndex to derive
// the search queries and the keyword-to-provider lookup.
Registry *providers.Registry
// Limiters, when non-nil, is waited on before every request using this
// source's Name, RateLimit and Burst.
Limiters *recon.LimiterRegistry
// client performs the HTTP requests; Sweep creates it with NewClient on
// first use when it is nil.
client *Client
}
// Compile-time assertion that *BinaryEdgeSource satisfies recon.ReconSource.
var _ recon.ReconSource = (*BinaryEdgeSource)(nil)
// Name returns the identifier of this source, "binaryedge".
func (s *BinaryEdgeSource) Name() string {
	return "binaryedge"
}
// RateLimit returns a limit of one request every two seconds.
func (s *BinaryEdgeSource) RateLimit() rate.Limit {
	const interval = 2 * time.Second
	return rate.Every(interval)
}
// Burst returns the limiter burst size for this source, which is 1.
func (s *BinaryEdgeSource) Burst() int {
	return 1
}
// RespectsRobots always reports false for this source.
func (s *BinaryEdgeSource) RespectsRobots() bool {
	return false
}
// Enabled reports whether an API key has been set; the supplied config is
// not consulted.
func (s *BinaryEdgeSource) Enabled(_ recon.Config) bool {
	return len(s.APIKey) > 0
}
// Sweep runs one BinaryEdge search per provider keyword query and pushes a
// Finding onto out for each event in the response.
//
// It returns nil immediately when no API key is set. Context errors, limiter
// errors, request-construction errors and ErrUnauthorized abort the sweep and
// are returned; any other request failure or a JSON decode failure only skips
// the current query.
func (s *BinaryEdgeSource) Sweep(ctx context.Context, _ string, out chan<- recon.Finding) error {
	if s.APIKey == "" {
		return nil
	}
	if s.client == nil {
		s.client = NewClient()
	}

	root := "https://api.binaryedge.io"
	if s.BaseURL != "" {
		root = s.BaseURL
	}

	queries := BuildQueries(s.Registry, "binaryedge")
	providerByKeyword := binaryedgeKeywordIndex(s.Registry)

	for _, query := range queries {
		if ctxErr := ctx.Err(); ctxErr != nil {
			return ctxErr
		}
		if s.Limiters != nil {
			waitErr := s.Limiters.Wait(ctx, s.Name(), s.RateLimit(), s.Burst(), false)
			if waitErr != nil {
				return waitErr
			}
		}

		target := root + "/v2/query/search?query=" + url.QueryEscape(query) + "&page=1"
		req, err := http.NewRequestWithContext(ctx, http.MethodGet, target, nil)
		if err != nil {
			return fmt.Errorf("binaryedge: build request: %w", err)
		}
		req.Header.Set("X-Key", s.APIKey)
		req.Header.Set("Accept", "application/json")

		resp, err := s.client.Do(ctx, req)
		switch {
		case err == nil:
			// Proceed to decoding below.
		case errors.Is(err, ErrUnauthorized),
			errors.Is(err, context.Canceled),
			errors.Is(err, context.DeadlineExceeded):
			// Fatal for the whole sweep: bad credentials or a dead context.
			return err
		default:
			// Any other failure affects only this query.
			continue
		}

		var payload binaryedgeSearchResponse
		decodeErr := json.NewDecoder(resp.Body).Decode(&payload)
		_ = resp.Body.Close()
		if decodeErr != nil {
			continue
		}

		provider := providerByKeyword[strings.ToLower(query)]
		for _, event := range payload.Events {
			finding := recon.Finding{
				ProviderName: provider,
				Confidence:   "low",
				Source:       fmt.Sprintf("binaryedge://%s:%d", event.Target.IP, event.Target.Port),
				SourceType:   "recon:binaryedge",
				DetectedAt:   time.Now(),
			}
			select {
			case <-ctx.Done():
				return ctx.Err()
			case out <- finding:
			}
		}
	}
	return nil
}
// binaryedgeSearchResponse is the subset of the search response body that
// Sweep decodes: the list of result events.
type binaryedgeSearchResponse struct {
Events []binaryedgeEvent `json:"events"`
}
// binaryedgeEvent is a single entry of the "events" array; only its
// "target" object is decoded.
type binaryedgeEvent struct {
Target binaryedgeTarget `json:"target"`
}
// binaryedgeTarget carries the "ip" and "port" fields of an event target,
// which Sweep formats into the Finding's Source as binaryedge://ip:port.
type binaryedgeTarget struct {
IP string `json:"ip"`
Port int `json:"port"`
}
// binaryedgeKeywordIndex builds a lookup from each provider keyword (trimmed
// and lowercased) to a provider name. When several providers share a keyword,
// the first one returned by reg.List() wins. Blank keywords are ignored, and
// a nil registry yields an empty, non-nil map.
func binaryedgeKeywordIndex(reg *providers.Registry) map[string]string {
	index := make(map[string]string)
	if reg == nil {
		return index
	}
	for _, provider := range reg.List() {
		for _, raw := range provider.Keywords {
			key := strings.ToLower(strings.TrimSpace(raw))
			if key == "" {
				continue
			}
			if _, seen := index[key]; seen {
				continue
			}
			index[key] = provider.Name
		}
	}
	return index
}

View File

@@ -0,0 +1,117 @@
package sources
import (
"context"
"encoding/json"
"errors"
"net/http"
"net/http/httptest"
"strings"
"sync/atomic"
"testing"
"time"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// binaryedgeStubHandler returns a handler that increments calls on every
// request, reports a test error when the path does not start with
// /v2/query/search or the X-Key header is not "testkey", and replies with a
// fixed JSON body containing two events.
func binaryedgeStubHandler(t *testing.T, calls *int32) http.HandlerFunc {
	t.Helper()
	canned := binaryedgeSearchResponse{
		Events: []binaryedgeEvent{
			{Target: binaryedgeTarget{IP: "192.168.1.1", Port: 80}},
			{Target: binaryedgeTarget{IP: "192.168.1.2", Port: 443}},
		},
	}
	return func(w http.ResponseWriter, r *http.Request) {
		atomic.AddInt32(calls, 1)
		if path := r.URL.Path; !strings.HasPrefix(path, "/v2/query/search") {
			t.Errorf("unexpected path: %s", path)
		}
		if key := r.Header.Get("X-Key"); key != "testkey" {
			t.Errorf("missing X-Key header: %q", key)
		}
		w.Header().Set("Content-Type", "application/json")
		_ = json.NewEncoder(w).Encode(canned)
	}
}
// TestBinaryEdgeSource_EnabledRequiresAPIKey checks that Enabled is false
// with an empty API key and true once a key is set.
func TestBinaryEdgeSource_EnabledRequiresAPIKey(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()

	cases := []struct {
		apiKey string
		want   bool
		msg    string
	}{
		{apiKey: "", want: false, msg: "expected Enabled=false with empty key"},
		{apiKey: "key", want: true, msg: "expected Enabled=true with key"},
	}
	for _, tc := range cases {
		src := &BinaryEdgeSource{APIKey: tc.apiKey, Registry: reg, Limiters: lim}
		if src.Enabled(recon.Config{}) != tc.want {
			t.Error(tc.msg)
		}
	}
}
// TestBinaryEdgeSource_SweepEmitsFindings runs Sweep against a stub server
// and expects four findings tagged recon:binaryedge and two API calls.
func TestBinaryEdgeSource_SweepEmitsFindings(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("binaryedge", 1000, 100)

	var hits int32
	srv := httptest.NewServer(binaryedgeStubHandler(t, &hits))
	defer srv.Close()

	src := &BinaryEdgeSource{
		APIKey:   "testkey",
		BaseURL:  srv.URL,
		Registry: reg,
		Limiters: lim,
	}

	sink := make(chan recon.Finding, 32)
	ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
	defer cancel()

	// Run Sweep in the background; the channel is closed once it returns so
	// the collection loop below terminates.
	result := make(chan error, 1)
	go func() {
		defer close(sink)
		result <- src.Sweep(ctx, "", sink)
	}()

	var got []recon.Finding
	for finding := range sink {
		got = append(got, finding)
	}
	if err := <-result; err != nil {
		t.Fatalf("Sweep error: %v", err)
	}

	// 2 keywords * 2 events = 4 findings
	if len(got) != 4 {
		t.Fatalf("expected 4 findings, got %d", len(got))
	}
	for i := range got {
		if got[i].SourceType != "recon:binaryedge" {
			t.Errorf("SourceType=%q want recon:binaryedge", got[i].SourceType)
		}
	}
	if n := atomic.LoadInt32(&hits); n != 2 {
		t.Errorf("expected 2 API calls, got %d", n)
	}
}
// TestBinaryEdgeSource_CtxCancelled checks that Sweep returns
// context.Canceled when called with an already-cancelled context.
func TestBinaryEdgeSource_CtxCancelled(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("binaryedge", 1000, 100)

	src := &BinaryEdgeSource{
		APIKey:   "key",
		BaseURL:  "http://127.0.0.1:1",
		Registry: reg,
		Limiters: lim,
	}

	ctx, cancel := context.WithCancel(context.Background())
	cancel()

	sink := make(chan recon.Finding, 1)
	if err := src.Sweep(ctx, "", sink); !errors.Is(err, context.Canceled) {
		t.Fatalf("expected context.Canceled, got %v", err)
	}
}

144
pkg/recon/sources/fofa.go Normal file
View File

@@ -0,0 +1,144 @@
package sources
import (
"context"
"encoding/base64"
"encoding/json"
"errors"
"fmt"
"net/http"
"strings"
"time"
"golang.org/x/time/rate"
"github.com/salvacybersec/keyhunter/pkg/providers"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// FOFASource implements recon.ReconSource against the FOFA internet search
// engine API. It iterates provider keyword queries and emits a Finding per
// result.
//
// A missing Email or API key disables the source without error.
type FOFASource struct {
// Email is sent as the "email" query parameter of every search request.
Email string
// APIKey is sent as the "key" query parameter of every search request.
APIKey string
// BaseURL overrides the API root. Sweep falls back to https://fofa.info
// when it is empty.
BaseURL string
// Registry is passed to BuildQueries and fofaKeywordIndex to derive the
// search queries and the keyword-to-provider lookup.
Registry *providers.Registry
// Limiters, when non-nil, is waited on before every request using this
// source's Name, RateLimit and Burst.
Limiters *recon.LimiterRegistry
// client performs the HTTP requests; Sweep creates it with NewClient on
// first use when it is nil.
client *Client
}
// Compile-time assertion that *FOFASource satisfies recon.ReconSource.
var _ recon.ReconSource = (*FOFASource)(nil)
// Name returns the identifier of this source, "fofa".
func (s *FOFASource) Name() string {
	return "fofa"
}
// RateLimit returns a limit of one request per second.
func (s *FOFASource) RateLimit() rate.Limit {
	const interval = 1 * time.Second
	return rate.Every(interval)
}
// Burst returns the limiter burst size for this source, which is 1.
func (s *FOFASource) Burst() int {
	return 1
}
// RespectsRobots always reports false for this source.
func (s *FOFASource) RespectsRobots() bool {
	return false
}
// Enabled reports whether both Email and APIKey have been set; the supplied
// config is not consulted.
func (s *FOFASource) Enabled(_ recon.Config) bool {
	if s.Email == "" {
		return false
	}
	return s.APIKey != ""
}
// Sweep issues one FOFA search request per provider keyword query and emits
// a Finding for every result row that has at least three columns
// ([host, ip, port]); shorter rows are skipped.
//
// It returns nil immediately when Email or APIKey is empty. Context errors,
// limiter errors, request-construction errors and ErrUnauthorized abort the
// sweep and are returned; any other request failure or a JSON decode failure
// only skips the current query.
func (s *FOFASource) Sweep(ctx context.Context, _ string, out chan<- recon.Finding) error {
	if s.Email == "" || s.APIKey == "" {
		return nil
	}
	if s.client == nil {
		s.client = NewClient()
	}
	base := s.BaseURL
	if base == "" {
		base = "https://fofa.info"
	}
	queries := BuildQueries(s.Registry, "fofa")
	kwIndex := fofaKeywordIndex(s.Registry)
	for _, q := range queries {
		if err := ctx.Err(); err != nil {
			return err
		}
		if s.Limiters != nil {
			if err := s.Limiters.Wait(ctx, s.Name(), s.RateLimit(), s.Burst(), false); err != nil {
				return err
			}
		}

		req, err := http.NewRequestWithContext(ctx, http.MethodGet, base+"/api/v1/search/all", nil)
		if err != nil {
			return fmt.Errorf("fofa: build request: %w", err)
		}
		// Build the query string through url.Values so every parameter is
		// percent-encoded. Standard base64 output can contain '+', '/' and
		// '=', and an e-mail address can contain '+' or '&'; sent raw, a '+'
		// is decoded as a space by the server and corrupts the value.
		params := req.URL.Query()
		params.Set("email", s.Email)
		params.Set("key", s.APIKey)
		params.Set("qbase64", base64.StdEncoding.EncodeToString([]byte(q)))
		params.Set("size", "100")
		req.URL.RawQuery = params.Encode()
		req.Header.Set("Accept", "application/json")

		resp, err := s.client.Do(ctx, req)
		if err != nil {
			// Bad credentials or a dead context end the whole sweep.
			if errors.Is(err, ErrUnauthorized) {
				return err
			}
			if errors.Is(err, context.Canceled) || errors.Is(err, context.DeadlineExceeded) {
				return err
			}
			// Any other failure affects only this query.
			continue
		}
		var parsed fofaSearchResponse
		decErr := json.NewDecoder(resp.Body).Decode(&parsed)
		_ = resp.Body.Close()
		if decErr != nil {
			continue
		}
		provName := kwIndex[strings.ToLower(q)]
		for _, row := range parsed.Results {
			// Each row is [host, ip, port].
			if len(row) < 3 {
				continue
			}
			f := recon.Finding{
				ProviderName: provName,
				Confidence:   "low",
				Source:       fmt.Sprintf("fofa://%s:%s", row[1], row[2]),
				SourceType:   "recon:fofa",
				DetectedAt:   time.Now(),
			}
			select {
			case out <- f:
			case <-ctx.Done():
				return ctx.Err()
			}
		}
	}
	return nil
}
// fofaSearchResponse is the subset of the search response body that is
// decoded.
type fofaSearchResponse struct {
// Results holds the result rows; Sweep treats each row as [host, ip, port]
// and reads the ip and port columns.
Results [][]string `json:"results"`
// Size is decoded from the "size" field; Sweep does not read it.
Size int `json:"size"`
}
// fofaKeywordIndex builds a lookup from each provider keyword (trimmed and
// lowercased) to a provider name. When several providers share a keyword, the
// first one returned by reg.List() wins. Blank keywords are ignored, and a
// nil registry yields an empty, non-nil map.
func fofaKeywordIndex(reg *providers.Registry) map[string]string {
	index := make(map[string]string)
	if reg == nil {
		return index
	}
	for _, provider := range reg.List() {
		for _, raw := range provider.Keywords {
			key := strings.ToLower(strings.TrimSpace(raw))
			if key == "" {
				continue
			}
			if _, seen := index[key]; seen {
				continue
			}
			index[key] = provider.Name
		}
	}
	return index
}

View File

@@ -0,0 +1,130 @@
package sources
import (
"context"
"encoding/json"
"errors"
"net/http"
"net/http/httptest"
"sync/atomic"
"testing"
"time"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// fofaStubHandler returns a handler that increments calls on every request,
// reports a test error when the path is not /api/v1/search/all or the email
// and key query parameters differ from the expected test values, and replies
// with a fixed JSON body containing two result rows.
func fofaStubHandler(t *testing.T, calls *int32) http.HandlerFunc {
	t.Helper()
	canned := fofaSearchResponse{
		Results: [][]string{
			{"example.com", "1.2.3.4", "443"},
			{"test.org", "5.6.7.8", "8080"},
		},
		Size: 2,
	}
	return func(w http.ResponseWriter, r *http.Request) {
		atomic.AddInt32(calls, 1)
		if path := r.URL.Path; path != "/api/v1/search/all" {
			t.Errorf("unexpected path: %s", path)
		}
		if email := r.URL.Query().Get("email"); email != "test@example.com" {
			t.Errorf("missing email param: %q", email)
		}
		if key := r.URL.Query().Get("key"); key != "testkey" {
			t.Errorf("missing key param: %q", key)
		}
		w.Header().Set("Content-Type", "application/json")
		_ = json.NewEncoder(w).Encode(canned)
	}
}
// TestFOFASource_EnabledRequiresCredentials checks that Enabled is true only
// when both Email and APIKey are set.
func TestFOFASource_EnabledRequiresCredentials(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()

	cases := []struct {
		email  string
		apiKey string
		want   bool
		msg    string
	}{
		{email: "", apiKey: "", want: false, msg: "expected Enabled=false with empty credentials"},
		{email: "a@b.com", apiKey: "", want: false, msg: "expected Enabled=false with empty APIKey"},
		{email: "", apiKey: "key", want: false, msg: "expected Enabled=false with empty Email"},
		{email: "a@b.com", apiKey: "key", want: true, msg: "expected Enabled=true with both credentials"},
	}
	for _, tc := range cases {
		src := &FOFASource{Email: tc.email, APIKey: tc.apiKey, Registry: reg, Limiters: lim}
		if src.Enabled(recon.Config{}) != tc.want {
			t.Error(tc.msg)
		}
	}
}
// TestFOFASource_SweepEmitsFindings runs Sweep against a stub server and
// expects four findings tagged recon:fofa and two API calls.
func TestFOFASource_SweepEmitsFindings(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("fofa", 1000, 100)

	var hits int32
	srv := httptest.NewServer(fofaStubHandler(t, &hits))
	defer srv.Close()

	src := &FOFASource{
		Email:    "test@example.com",
		APIKey:   "testkey",
		BaseURL:  srv.URL,
		Registry: reg,
		Limiters: lim,
	}

	sink := make(chan recon.Finding, 32)
	ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
	defer cancel()

	// Run Sweep in the background; the channel is closed once it returns so
	// the collection loop below terminates.
	result := make(chan error, 1)
	go func() {
		defer close(sink)
		result <- src.Sweep(ctx, "", sink)
	}()

	var got []recon.Finding
	for finding := range sink {
		got = append(got, finding)
	}
	if err := <-result; err != nil {
		t.Fatalf("Sweep error: %v", err)
	}

	// 2 keywords * 2 results = 4 findings
	if len(got) != 4 {
		t.Fatalf("expected 4 findings, got %d", len(got))
	}
	for i := range got {
		if got[i].SourceType != "recon:fofa" {
			t.Errorf("SourceType=%q want recon:fofa", got[i].SourceType)
		}
	}
	if n := atomic.LoadInt32(&hits); n != 2 {
		t.Errorf("expected 2 API calls, got %d", n)
	}
}
// TestFOFASource_CtxCancelled checks that Sweep returns context.Canceled
// when called with an already-cancelled context.
func TestFOFASource_CtxCancelled(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("fofa", 1000, 100)

	src := &FOFASource{
		Email:    "a@b.com",
		APIKey:   "key",
		BaseURL:  "http://127.0.0.1:1",
		Registry: reg,
		Limiters: lim,
	}

	ctx, cancel := context.WithCancel(context.Background())
	cancel()

	sink := make(chan recon.Finding, 1)
	if err := src.Sweep(ctx, "", sink); !errors.Is(err, context.Canceled) {
		t.Fatalf("expected context.Canceled, got %v", err)
	}
}

147
pkg/recon/sources/netlas.go Normal file
View File

@@ -0,0 +1,147 @@
package sources
import (
"context"
"encoding/json"
"errors"
"fmt"
"net/http"
"net/url"
"strings"
"time"
"golang.org/x/time/rate"
"github.com/salvacybersec/keyhunter/pkg/providers"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// NetlasSource implements recon.ReconSource against the Netlas internet
// intelligence API. It iterates provider keyword queries and emits a Finding
// per result item.
//
// A missing API key disables the source without error.
type NetlasSource struct {
// APIKey is sent as the X-API-Key request header. When empty, Enabled
// reports false and Sweep returns nil without issuing any request.
APIKey string
// BaseURL overrides the API root. Sweep falls back to
// https://app.netlas.io when it is empty.
BaseURL string
// Registry is passed to BuildQueries and netlasKeywordIndex to derive the
// search queries and the keyword-to-provider lookup.
Registry *providers.Registry
// Limiters, when non-nil, is waited on before every request using this
// source's Name, RateLimit and Burst.
Limiters *recon.LimiterRegistry
// client performs the HTTP requests; Sweep creates it with NewClient on
// first use when it is nil.
client *Client
}
// Compile-time assertion that *NetlasSource satisfies recon.ReconSource.
var _ recon.ReconSource = (*NetlasSource)(nil)
// Name returns the identifier of this source, "netlas".
func (s *NetlasSource) Name() string {
	return "netlas"
}
// RateLimit returns a limit of one request per second.
func (s *NetlasSource) RateLimit() rate.Limit {
	const interval = 1 * time.Second
	return rate.Every(interval)
}
// Burst returns the limiter burst size for this source, which is 1.
func (s *NetlasSource) Burst() int {
	return 1
}
// RespectsRobots always reports false for this source.
func (s *NetlasSource) RespectsRobots() bool {
	return false
}
// Enabled reports whether an API key has been set; the supplied config is
// not consulted.
func (s *NetlasSource) Enabled(_ recon.Config) bool {
	return len(s.APIKey) > 0
}
// Sweep runs one Netlas search per provider keyword query and pushes a
// Finding onto out for each item in the response.
//
// It returns nil immediately when no API key is set. Context errors, limiter
// errors, request-construction errors and ErrUnauthorized abort the sweep and
// are returned; any other request failure or a JSON decode failure only skips
// the current query.
func (s *NetlasSource) Sweep(ctx context.Context, _ string, out chan<- recon.Finding) error {
	if s.APIKey == "" {
		return nil
	}
	if s.client == nil {
		s.client = NewClient()
	}

	root := "https://app.netlas.io"
	if s.BaseURL != "" {
		root = s.BaseURL
	}

	queries := BuildQueries(s.Registry, "netlas")
	providerByKeyword := netlasKeywordIndex(s.Registry)

	for _, query := range queries {
		if ctxErr := ctx.Err(); ctxErr != nil {
			return ctxErr
		}
		if s.Limiters != nil {
			waitErr := s.Limiters.Wait(ctx, s.Name(), s.RateLimit(), s.Burst(), false)
			if waitErr != nil {
				return waitErr
			}
		}

		target := root + "/api/responses/?q=" + url.QueryEscape(query) + "&start=0&indices="
		req, err := http.NewRequestWithContext(ctx, http.MethodGet, target, nil)
		if err != nil {
			return fmt.Errorf("netlas: build request: %w", err)
		}
		req.Header.Set("X-API-Key", s.APIKey)
		req.Header.Set("Accept", "application/json")

		resp, err := s.client.Do(ctx, req)
		switch {
		case err == nil:
			// Proceed to decoding below.
		case errors.Is(err, ErrUnauthorized),
			errors.Is(err, context.Canceled),
			errors.Is(err, context.DeadlineExceeded):
			// Fatal for the whole sweep: bad credentials or a dead context.
			return err
		default:
			// Any other failure affects only this query.
			continue
		}

		var payload netlasSearchResponse
		decodeErr := json.NewDecoder(resp.Body).Decode(&payload)
		_ = resp.Body.Close()
		if decodeErr != nil {
			continue
		}

		provider := providerByKeyword[strings.ToLower(query)]
		for _, item := range payload.Items {
			finding := recon.Finding{
				ProviderName: provider,
				Confidence:   "low",
				Source:       fmt.Sprintf("netlas://%s:%d", item.Data.IP, item.Data.Port),
				SourceType:   "recon:netlas",
				DetectedAt:   time.Now(),
			}
			select {
			case <-ctx.Done():
				return ctx.Err()
			case out <- finding:
			}
		}
	}
	return nil
}
// netlasSearchResponse is the subset of the search response body that Sweep
// decodes: the list of result items.
type netlasSearchResponse struct {
Items []netlasItem `json:"items"`
}
// netlasItem is a single entry of the "items" array; only its "data" object
// is decoded.
type netlasItem struct {
Data netlasData `json:"data"`
}
// netlasData carries the "ip" and "port" fields of an item, which Sweep
// formats into the Finding's Source as netlas://ip:port.
type netlasData struct {
IP string `json:"ip"`
Port int `json:"port"`
}
// netlasKeywordIndex builds a lookup from each provider keyword (trimmed and
// lowercased) to a provider name. When several providers share a keyword, the
// first one returned by reg.List() wins. Blank keywords are ignored, and a
// nil registry yields an empty, non-nil map.
func netlasKeywordIndex(reg *providers.Registry) map[string]string {
	index := make(map[string]string)
	if reg == nil {
		return index
	}
	for _, provider := range reg.List() {
		for _, raw := range provider.Keywords {
			key := strings.ToLower(strings.TrimSpace(raw))
			if key == "" {
				continue
			}
			if _, seen := index[key]; seen {
				continue
			}
			index[key] = provider.Name
		}
	}
	return index
}

View File

@@ -0,0 +1,117 @@
package sources
import (
"context"
"encoding/json"
"errors"
"net/http"
"net/http/httptest"
"strings"
"sync/atomic"
"testing"
"time"
"github.com/salvacybersec/keyhunter/pkg/recon"
)
// netlasStubHandler returns a handler that increments calls on every
// request, reports a test error when the path does not start with
// /api/responses/ or the X-API-Key header is not "testkey", and replies with
// a fixed JSON body containing two items.
func netlasStubHandler(t *testing.T, calls *int32) http.HandlerFunc {
	t.Helper()
	canned := netlasSearchResponse{
		Items: []netlasItem{
			{Data: netlasData{IP: "10.0.0.1", Port: 443}},
			{Data: netlasData{IP: "10.0.0.2", Port: 8443}},
		},
	}
	return func(w http.ResponseWriter, r *http.Request) {
		atomic.AddInt32(calls, 1)
		if path := r.URL.Path; !strings.HasPrefix(path, "/api/responses/") {
			t.Errorf("unexpected path: %s", path)
		}
		if key := r.Header.Get("X-API-Key"); key != "testkey" {
			t.Errorf("missing X-API-Key header: %q", key)
		}
		w.Header().Set("Content-Type", "application/json")
		_ = json.NewEncoder(w).Encode(canned)
	}
}
// TestNetlasSource_EnabledRequiresAPIKey checks that Enabled is false with an
// empty API key and true once a key is set.
func TestNetlasSource_EnabledRequiresAPIKey(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()

	cases := []struct {
		apiKey string
		want   bool
		msg    string
	}{
		{apiKey: "", want: false, msg: "expected Enabled=false with empty key"},
		{apiKey: "key", want: true, msg: "expected Enabled=true with key"},
	}
	for _, tc := range cases {
		src := &NetlasSource{APIKey: tc.apiKey, Registry: reg, Limiters: lim}
		if src.Enabled(recon.Config{}) != tc.want {
			t.Error(tc.msg)
		}
	}
}
// TestNetlasSource_SweepEmitsFindings runs Sweep against a stub server and
// expects four findings tagged recon:netlas and two API calls.
func TestNetlasSource_SweepEmitsFindings(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("netlas", 1000, 100)

	var hits int32
	srv := httptest.NewServer(netlasStubHandler(t, &hits))
	defer srv.Close()

	src := &NetlasSource{
		APIKey:   "testkey",
		BaseURL:  srv.URL,
		Registry: reg,
		Limiters: lim,
	}

	sink := make(chan recon.Finding, 32)
	ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
	defer cancel()

	// Run Sweep in the background; the channel is closed once it returns so
	// the collection loop below terminates.
	result := make(chan error, 1)
	go func() {
		defer close(sink)
		result <- src.Sweep(ctx, "", sink)
	}()

	var got []recon.Finding
	for finding := range sink {
		got = append(got, finding)
	}
	if err := <-result; err != nil {
		t.Fatalf("Sweep error: %v", err)
	}

	// 2 keywords * 2 items = 4 findings
	if len(got) != 4 {
		t.Fatalf("expected 4 findings, got %d", len(got))
	}
	for i := range got {
		if got[i].SourceType != "recon:netlas" {
			t.Errorf("SourceType=%q want recon:netlas", got[i].SourceType)
		}
	}
	if n := atomic.LoadInt32(&hits); n != 2 {
		t.Errorf("expected 2 API calls, got %d", n)
	}
}
// TestNetlasSource_CtxCancelled checks that Sweep returns context.Canceled
// when called with an already-cancelled context.
func TestNetlasSource_CtxCancelled(t *testing.T) {
	reg := syntheticRegistry()
	lim := recon.NewLimiterRegistry()
	_ = lim.For("netlas", 1000, 100)

	src := &NetlasSource{
		APIKey:   "key",
		BaseURL:  "http://127.0.0.1:1",
		Registry: reg,
		Limiters: lim,
	}

	ctx, cancel := context.WithCancel(context.Background())
	cancel()

	sink := make(chan recon.Finding, 1)
	if err := src.Sweep(ctx, "", sink); !errors.Is(err, context.Canceled) {
		t.Fatalf("expected context.Canceled, got %v", err)
	}
}