instagram-attack/config.yml at master · nickmflorin/instagram-attack · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
### Instattack Configuration Settings
### TODO: Turn Into Python File

instattack:
    debug: true

    log.logging:
        level: 'debug'
        log_request_errors: true
        log_proxy_queue: true

connection:
    limit_per_host: 0
    connection_timeout: 14
    connection_limit: 0


login:

    passwords:
        # The number of concurrent passwords to try at the same time.
        passwords_batch_size: 10

        generator:
            # TODO: Add validation to make sure all elements of nested lists are
            # integers.
            capitalize_at_indices: [0, 1, [0, 1]]

            alterations:
                before: false
                after: true

            numerics:
                before: false
                after: true
                birthday:
                    provided: true
                    all: false
                    # TODO: Make required based on the value of `all`.
                    start_year: 1991
                    end_year: 2000

    attempts:
        # The number of concurrent requests to make for each password.
        attempts_batch_size: 20
        save_method: 'end'


proxies:
    save_method: 'end'
    countries: ['US']

    train:
        batch_size: 50
        # timeout: 10  # Replaces Timeout for Connection

    # Settings Here Only Matter if Collect = True
    # Do we want to add a limit to the broker collection?
    broker:
        # The maximum number of concurrent checks of proxies
        broker_max_conn: 200

        # The maximum number of attempts to check a proxy
        # Note that the lower the value of max_tries, the faster the broker will return
        # proxies, but they will not contain as much information to gauge their
        # relative reliability and speed.
        broker_max_tries: 2

        # Maximum amount of time to wait for broker to return a proxy before failing.
        broker_timeout: 5

    pool:
        # The maximum amount of time to wait for a proxy from the queue before failing.
        pool_timeout: 10
        collect: false

        # 3 Purposes:
        #   (1) Initial Population of Confirmed Queue
        #   (2) Whether or Not Evaluation Can be Ignored
        #   (3) Whether or not Error Causes Confirmed Proxy to be Removed

        # Right now this checks if both are satisfied, but we might want the ability
        # to check if either is specified, and over what range.
        confirmation:
            threshold: 2
            horizon: 5
            threshold_in_horizon: 1

        # We do not need the confirmed fields since they already are factored
        # in based on the separate queues.
        priority: [
            [-1, ['requests', 'active', 'success']],
            [1, ['error_rate', 'active']],
            [-1, ['requests', 'historical', 'success']],
            [1, ['error_rate', 'historical']],
            [1, ['avg_resp_time']]
        ]

        # The amount of time to wait before using a proxy that raises an error
        # that does not indicate an invalid proxy.
        # Each additional increment is calculated as increment = start*e^(c*x), where
        # x is the number of times the request has failed consecutively.
        # After the max value has been reached via incrementation, the
        # proxy will be discarded.
        timeouts:
            too_many_requests:
                increment: 5
                start: 5
                max: 40

            too_many_open_connections:
                increment: 5
                start: 5
                max: 40

        limits:
            # The maximum response time in seconds. If proxy.avg_resp_time exceeds this
            # value, proxy will be removed from the pool.
            # TODO: Allow Historical & Current
            resp_time: null

            # The maxmium number of allowed requests for each proxy per attack, before
            # being removed from pool.  For LARGER attacks, this should probably be
            # negated, since we do not want to discard good proxies.
            requests:
                all:
                    historical: null
                    active: null
                success:
                    historical: null
                    active: null
                fail:
                    historical: null
                    active: null

            # The maximum overall error rate for a proxy to be put into or used from
            # the pool.
            # TODO: Start Measuring Historical & Active
            error_rate:
                historical: null
                active: null
                # The minimum number of requests required before error rate is non-zero.
                horizon: 5

            # The maximum number of allowed errors for a proxy before being
            # removed from the pool or not included in pool to begin with.
            errors:
                # Right now, too_many_requests counts as a general error, so
                # we probably do not want to limit the number of total errors.
                # We need to treat too_many_requests as a warning.
                # all:
                #     historical: 2
                #     active: 1
                connection:
                    historical: 2
                    active: 1
                response:
                    historical: 2
                    active: 1
                instagram:
                    historical: 1
                    active: 1
                ssl:
                    historical: 3
                    active: 2
                timeout:
                    # There seem to be a lot of proxies that do get confirmed results
                    # but also have a lot of historical timeout errors.
                    historical: 4
                    active: 2