Blackjack-Strategy-Simulator/expected_value.py at main · AttackingOrDefending/Blackjack-Strategy-Simulator · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
"""Estimate the expected value of a given strategy."""
from __future__ import annotations
from utils import get_cards_seen, DECK, readable_number
from action_strategies import BaseMover
from betting_strategies import BaseBetter
from collections import deque
from typing import Iterable
import matplotlib.pyplot as plt
import random
import betting_strategies
import action_strategies
import argparse
import multiprocessing


class Hand:
    """Hold information about the hand of the player and the dealer."""

    def __init__(self, cards: Iterable[int]) -> None:
        """
        Save the initial cards.

        :param cards: The cards the hand started with.
        """
        self.cards = list(cards)

    def add_card(self, card: int) -> None:
        """
        Add a new card to the hand.

        :param card: The new card to add for the hand (an ace is symbolised as 11).
        """
        self.cards.append(card)

    def value_ace(self) -> tuple[int, int]:
        """
        Return the value of a hand and how many aces that count as 11 it has.

        :return: The hand's value and how many aces are counted as 11 (0 or 1).
        """
        value = sum(self.cards)
        aces = self.cards.count(11)
        while value > 21 and aces:
            value -= 10
            aces -= 1
        return value, aces

    def aces(self) -> int:
        """
        Return the number of aces that count as 11.

        :return: The number of aces counted as 11.
        """
        return self.value_ace()[1]

    def value(self) -> int:
        """
        Return the value of a hand.

        :return: The hand's value.
        """
        return self.value_ace()[0]


def get_card_from_shoe(shoe: list[int]) -> int:
    """
    Get a card from the shoe. Always returns the last item from the shoe, so the shoe must be shuffled before.

    :param shoe: The shoe to get a card from.
    :return: The card we got from the shoe.
    """
    card = shoe.pop()
    return card


def get_mover_and_better(mover_name: str, better_name: str
                         ) -> tuple[action_strategies.BaseMover, betting_strategies.BaseBetter]:
    """
    Get the mover and the better from the arguments passed by the user.

    :param mover_name: The name of the mover to use. If it isn't one of the recognized names,
        then in checks if there is a class of that name.
    :param better_name: The name of the better to use. If it isn't one of the recognized names,
        then in checks if there is a class of that name.
    :return: The mover and the better to use, already set up.
    """
    mover_class: action_strategies.BaseMover
    better_class: betting_strategies.BaseBetter
    if mover_name == "card-count":
        mover_class = action_strategies.CardCountMover(
            {(-1000, -10): "data/6deck_s17_das_peek_tc_minus_10.csv",
             (-10, -9): "data/6deck_s17_das_peek_tc_minus_9.csv",
             (-9, -8): "data/6deck_s17_das_peek_tc_minus_8.csv",
             (-8, -7): "data/6deck_s17_das_peek_tc_minus_7.csv",
             (-7, -6): "data/6deck_s17_das_peek_tc_minus_6.csv",
             (-6, -5): "data/6deck_s17_das_peek_tc_minus_5.csv",
             (-5, -4): "data/6deck_s17_das_peek_tc_minus_4.csv",
             (-4, -3): "data/6deck_s17_das_peek_tc_minus_3.csv",
             (-3, -2): "data/6deck_s17_das_peek_tc_minus_2.csv",
             (-2, -1): "data/6deck_s17_das_peek_tc_minus_1.csv",
             (-1, 1): "data/6deck_s17_das_peek_tc_0.csv",
             (1, 2): "data/6deck_s17_das_peek_tc_plus_1.csv",
             (2, 3): "data/6deck_s17_das_peek_tc_plus_2.csv",
             (3, 4): "data/6deck_s17_das_peek_tc_plus_3.csv",
             (4, 5): "data/6deck_s17_das_peek_tc_plus_4.csv",
             (5, 6): "data/6deck_s17_das_peek_tc_plus_5.csv",
             (6, 7): "data/6deck_s17_das_peek_tc_plus_6.csv",
             (7, 8): "data/6deck_s17_das_peek_tc_plus_7.csv",
             (8, 9): "data/6deck_s17_das_peek_tc_plus_8.csv",
             (9, 10): "data/6deck_s17_das_peek_tc_plus_9.csv",
             (10, 1000): "data/6deck_s17_das_peek_tc_plus_10.csv"})
    elif mover_name == "basic-strategy-deviations":
        mover_class = action_strategies.BasicStrategyDeviationsMover("data/6deck_s17_das_peek_basic_strategy.csv")
    elif mover_name == "basic-strategy":
        mover_class = action_strategies.BasicStrategyMover("data/6deck_s17_das_peek_basic_strategy.csv")
    elif mover_name == "perfect":
        mover_class = action_strategies.PerfectMover()
    elif mover_name == "simple":
        mover_class = action_strategies.SimpleMover()
    else:  # Run a user-defined class.
        mover_class = getattr(action_strategies, mover_name)()
    if better_name == "card-count":
        better_class = betting_strategies.CardCountBetter()
    elif better_name == "conservative-card-count":
        better_class = betting_strategies.ConservativeCardCountBetter()
    elif better_name == "wonging-card-count":
        better_class = betting_strategies.WongingCardCountBetter()
    elif better_name == "wonging-conservative-card-count":
        better_class = betting_strategies.WongingConservativeCardCountBetter()
    elif better_name == "simple":
        better_class = betting_strategies.SimpleBetter()
    else:  # Run a user-defined class.
        better_class = getattr(betting_strategies, better_name)()
    return mover_class, better_class


def play_dealer(dealer_cards: Iterable[int], shoe: list[int], dealer_stands_soft_17: bool) -> int:
    """
    Play the dealers hand to get its final value.

    :param dealer_cards: The cards the dealer already has.
    :param shoe: The shoe.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :return: The final value of the dealer's hand. If the dealer busted, the value is 0.
    """
    dealer = Hand(dealer_cards)
    while dealer.value() < 17 or not dealer_stands_soft_17 and dealer.value() == 17 and dealer.aces():
        dealer.add_card(get_card_from_shoe(shoe))
    dealer_value = dealer.value()
    return dealer_value if dealer_value <= 21 else 0


def play_hand(action_class: action_strategies.BaseMover,
              hand_cards: list[list[int]], dealer_up_card: int, dealer_down_card: int, shoe: list[int],
              splits_remaining: int, deck_number: int, dealer_peeks_for_blackjack: bool = True, das: bool = True,
              dealer_stands_soft_17: bool = True) -> tuple[list[list[int]], int]:
    """
    Play hands but don't play the dealer.

    :param action_class: The class that chooses the action.
    :param hand_cards: The cards in our hand.
    :param dealer_up_card: The dealer's up card.
    :param dealer_down_card: The dealer's down card.
    :param shoe: The shoe.
    :param splits_remaining: How many more splits we can do.
    :param deck_number: The number of decks in the initial shoe.
    :param dealer_peeks_for_blackjack: Whether the dealer peeks for blackjack.
    :param das: Whether we can double after splitting.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :return: The hands played out.
    """
    splits_used = 0
    done_hands = []
    for hand_index, cards in enumerate(hand_cards):
        if Hand(cards).value() > 21:
            done_hands.append(cards)
            continue
        can_split = (splits_remaining > 0 and len(cards) == 2 and cards[0] == cards[1]
                     and (not cards[0] == 11 or splits_remaining == 3))
        can_double = len(cards) == 2 and (das or splits_remaining == 3)
        cards_seen = get_cards_seen(deck_number, shoe)
        cards_seen.remove(dealer_down_card)
        hand = Hand(cards)
        initial_hand_value, initial_hand_has_ace = hand.value_ace()
        action, insure = action_class.get_move(initial_hand_value, bool(initial_hand_has_ace), dealer_up_card,
                                               can_double,
                                               can_split, False, False, cards, cards_seen, deck_number,
                                               dealer_peeks_for_blackjack, das, dealer_stands_soft_17)

        if action == "s":
            done_hands.append(cards)

        elif action == "d" and can_double:
            card = get_card_from_shoe(shoe)
            hand.add_card(card)
            done_hands.append(hand.cards)
            done_hands.append(hand.cards)  # Add the same hand twice instead of doubling the bet.

        elif action == "h":
            card = get_card_from_shoe(shoe)
            hand.add_card(card)
            hand_cards, _ = play_hand(action_class, [hand.cards], dealer_up_card, dealer_down_card, shoe,
                                      0, deck_number, dealer_peeks_for_blackjack, das,
                                      dealer_stands_soft_17)
            done_hands.append(hand_cards[0])

        elif action == "p" and can_split:
            splits_used += 1
            hand1 = Hand([hand.cards[0]])
            hand2 = Hand([hand.cards[1]])
            card1 = get_card_from_shoe(shoe)
            hand1.add_card(card1)
            done_split_hands, splits_used_first_hand = play_hand(action_class, [hand1.cards], dealer_up_card,
                                                                 dealer_down_card, shoe, splits_remaining - 1, deck_number,
                                                                 dealer_peeks_for_blackjack, das, dealer_stands_soft_17)
            done_hands.extend(done_split_hands)
            splits_used += splits_used_first_hand
            card2 = get_card_from_shoe(shoe)
            hand2.add_card(card2)
            done_split_hands, splits_used_second_hand = play_hand(action_class, [hand2.cards] + hand_cards[hand_index + 1:],
                                                                  dealer_up_card, dealer_down_card, shoe,
                                                                  splits_remaining - splits_used, deck_number,
                                                                  dealer_peeks_for_blackjack, das, dealer_stands_soft_17)
            done_hands.extend(done_split_hands)
            splits_used += splits_used_second_hand
            break

        else:
            raise ValueError(f"invalid action: {action}.")
    return done_hands, splits_used


def simulate_hand(action_class: action_strategies.BaseMover,
                  cards: list[int], dealer_up_card: int,
                  dealer_down_card: int, shoe: list[int],
                  splits_remaining: int, deck_number: int, dealer_peeks_for_blackjack: bool = True, das: bool = True,
                  dealer_stands_soft_17: bool = True, surrender_allowed: bool = True) -> float:
    """
    Play one hand.

    :param action_class: The class that chooses the action.
    :param cards: The cards in our hand.
    :param dealer_up_card: The dealer's up card.
    :param dealer_down_card: The dealer's down card.
    :param shoe: The shoe.
    :param splits_remaining: How many more splits we can do.
    :param deck_number: The number of decks in the initial shoe.
    :param dealer_peeks_for_blackjack: Whether the dealer peeks for blackjack.
    :param das: Whether we can double after splitting.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :param surrender_allowed: Whether the game rules allow surrendering.
    :return: The profit/loss from the hand, and how many times we split.
    """
    can_split = (splits_remaining > 0 and len(cards) == 2 and cards[0] == cards[1]
                 and (not cards[0] == 11 or splits_remaining == 3))
    can_double = len(cards) == 2 and (das or splits_remaining == 3)
    can_surrender_now = surrender_allowed
    can_insure = dealer_up_card == 11
    insurance_profit = 0.
    dealer_has_blackjack = dealer_up_card + dealer_down_card == 21
    player_has_blackjack = cards[0] + cards[1] == 21
    player_loses_all_bets = dealer_has_blackjack and not dealer_peeks_for_blackjack and not player_has_blackjack
    cards_seen = get_cards_seen(deck_number, shoe)
    cards_seen.remove(dealer_down_card)
    hand = Hand(cards)
    initial_hand_value, initial_hand_has_ace = hand.value_ace()
    action, insure = action_class.get_move(initial_hand_value, bool(initial_hand_has_ace), dealer_up_card, can_double,
                                           can_split, can_surrender_now, can_insure, cards, cards_seen, deck_number,
                                           dealer_peeks_for_blackjack, das, dealer_stands_soft_17)

    if insure and can_insure:
        insurance_profit = 1 if dealer_down_card == 10 else -.5

    if dealer_peeks_for_blackjack:
        if dealer_has_blackjack and player_has_blackjack:  # Push
            return 0 + insurance_profit
        elif dealer_has_blackjack:  # Dealer blackjack
            return -1 + insurance_profit
        elif player_has_blackjack:  # Player blackjack
            return 1 * 3 / 2 + insurance_profit
    else:
        if player_has_blackjack and dealer_has_blackjack:
            return 0 + insurance_profit
        elif player_has_blackjack:
            return 1 * 3 / 2 + insurance_profit

    if action == "u" and can_surrender_now:
        return -.5 + insurance_profit

    elif action == "s":
        dealer_value = play_dealer((dealer_up_card, dealer_down_card), shoe, dealer_stands_soft_17)
        if player_loses_all_bets:
            return -1 + insurance_profit
        if initial_hand_value > dealer_value:
            return 1 + insurance_profit
        elif initial_hand_value < dealer_value:
            return -1 + insurance_profit
        return 0 + insurance_profit

    elif action == "d" and can_double:
        card = get_card_from_shoe(shoe)
        hand.add_card(card)
        if player_loses_all_bets:
            return -2 + insurance_profit
        if hand.value() > 21:
            return -2 + insurance_profit
        dealer_value = play_dealer((dealer_up_card, dealer_down_card), shoe, dealer_stands_soft_17)
        if hand.value() > dealer_value:
            return +2 + insurance_profit
        elif hand.value() < dealer_value:
            return -2 + insurance_profit
        return 0 + insurance_profit

    elif action == "h":
        card = get_card_from_shoe(shoe)
        hand.add_card(card)
        if player_loses_all_bets:
            return -1 + insurance_profit
        if hand.value() > 21:
            return -1 + insurance_profit
        hands, _ = play_hand(action_class, [hand.cards], dealer_up_card, dealer_down_card, shoe,
                             splits_remaining, deck_number, dealer_peeks_for_blackjack, das, dealer_stands_soft_17)
        hand = Hand(hands[0])
        dealer_value = play_dealer((dealer_up_card, dealer_down_card), shoe, dealer_stands_soft_17)
        if hand.value() > 21 or dealer_value > hand.value():
            return -1 + insurance_profit
        elif hand.value() > dealer_value:
            return 1 + insurance_profit
        return 0 + insurance_profit

    elif action == "p" and can_split:
        hand1 = Hand([hand.cards[0]])
        hand2 = Hand([hand.cards[1]])
        if hand.cards[0] == 11:
            card = get_card_from_shoe(shoe)
            hand1.add_card(card)
            card = get_card_from_shoe(shoe)
            hand2.add_card(card)
            if player_loses_all_bets:
                return -2 + insurance_profit
            dealer_value = play_dealer((dealer_up_card, dealer_down_card), shoe, dealer_stands_soft_17)
            split_profit = 0
            if hand1.value() > 21 or dealer_value > hand1.value():
                split_profit -= 1
            elif hand1.value() > dealer_value:
                split_profit += 1
            if hand2.value() > 21 or dealer_value > hand2.value():
                split_profit -= 1
            elif hand2.value() > dealer_value:
                split_profit += 1
            return split_profit + insurance_profit
        card1 = get_card_from_shoe(shoe)
        hand1.add_card(card1)
        all_hands, splits_used = play_hand(action_class, [hand1.cards], dealer_up_card, dealer_down_card, shoe,
                                           splits_remaining - 1, deck_number, dealer_peeks_for_blackjack, das,
                                           dealer_stands_soft_17)
        card2 = get_card_from_shoe(shoe)
        hand2.add_card(card2)
        done_hands, _ = play_hand(action_class, [hand2.cards], dealer_up_card, dealer_down_card, shoe,
                                  splits_remaining - 1 - splits_used, deck_number, dealer_peeks_for_blackjack, das,
                                  dealer_stands_soft_17)
        all_hands += done_hands
        if player_loses_all_bets:
            return -len(all_hands) + insurance_profit
        dealer_value = play_dealer((dealer_up_card, dealer_down_card), shoe, dealer_stands_soft_17)
        split_profit = 0
        for hand_cards in all_hands:
            hand = Hand(hand_cards)
            if hand.value() > 21 or dealer_value > hand.value():
                split_profit -= 1
            elif hand.value() > dealer_value:
                split_profit += 1
        return split_profit + insurance_profit

    raise ValueError(f"invalid action: {action}.")


def expected_value(action_class: action_strategies.BaseMover, betting_class: betting_strategies.BaseBetter,
                   simulations: int, deck_number: int = 6, shoe_penetration: float = .25,
                   dealer_peeks_for_blackjack: bool = True, das: bool = True,
                   dealer_stands_soft_17: bool = True, surrender_allowed: bool = True,
                   units: int = 200, hands_played: int = 1000,
                   plot_profits: bool = True, print_info: bool = True) -> tuple[float, float, float, float, float]:
    """
    Estimate the expected value of a strategy.

    :param action_class: The class that chooses the action.
    :param betting_class: The class that chooses the bet.
    :param simulations: How many hands to play.
    :param deck_number: The number of decks in the initial shoe.
    :param shoe_penetration: When to reshuffle the shoe. Reshuffles when cards remaining < starting cards * deck penetration.
    :param dealer_peeks_for_blackjack: Whether the dealer peeks for blackjack.
    :param das: Whether we can double after splitting.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :param surrender_allowed: Whether the game rules allow surrendering.
    :param units: The number of units in total.
    :param hands_played: How many hands to play before checking the risk of ruin.
    :param plot_profits: Whether a plot showing how the profit changed over time should be made at the end.
    :param print_info: Whether to print information about the progress of the simulation. Disabled for multithreading.
    :return: The total return, the average return of a game, the average bet size, and the risk of ruin.
    """
    starting_shoe = DECK * deck_number
    starting_number = len(starting_shoe)
    reshuffle_at = int(starting_number * shoe_penetration)
    shoe = starting_shoe.copy()
    random.shuffle(shoe)
    profit = 0.
    profits_over_time_hand = [profit]
    bets = []
    for i in range(simulations):
        if print_info and i % 10_000 == 0:
            print(f"Games played: {readable_number(i)}/{readable_number(simulations)}")
        while len(shoe) >= reshuffle_at:
            cards_seen = get_cards_seen(deck_number, shoe)
            initial_bet = betting_class.get_bet(cards_seen, deck_number)
            player_cards = [get_card_from_shoe(shoe)]
            dealer_up_card = get_card_from_shoe(shoe)
            player_cards.append(get_card_from_shoe(shoe))
            dealer_down_card = get_card_from_shoe(shoe)

            cards_seen.extend([dealer_up_card] + player_cards)

            reward = simulate_hand(action_class, player_cards, dealer_up_card,
                                   dealer_down_card, shoe, 3, deck_number,
                                   dealer_peeks_for_blackjack, das, dealer_stands_soft_17, surrender_allowed)
            reward *= initial_bet
            profit += reward
            bets.append(initial_bet)
            profits_over_time_hand.append(profit)

        shoe = starting_shoe.copy()
        random.shuffle(shoe)

    total_bets = sum(bets)
    avg_profit = profit / total_bets if total_bets else 0
    avg_bet = total_bets / len(bets)
    non_zero_bets = [b for b in bets if b > 0]
    if not non_zero_bets:
        non_zero_bets = [0]
    avg_non_zero_bet = sum(non_zero_bets) / len(non_zero_bets)

    risk_of_ruin_count = 0
    total_sims = len(profits_over_time_hand)
    deque_min: deque[int] = deque()
    for index, profit in enumerate(profits_over_time_hand):
        while deque_min and deque_min[0] < index - hands_played + 1:
            deque_min.popleft()
        while deque_min and profits_over_time_hand[deque_min[-1]] >= profit:
            deque_min.pop()
        deque_min.append(index)
        if index >= hands_played - 1:
            if profits_over_time_hand[deque_min[0]] <= profit - units:
                risk_of_ruin_count += 1
    risk_of_ruin = risk_of_ruin_count / (total_sims - hands_played + 1) if total_sims >= hands_played else float("nan")

    if print_info:
        print(f"Total profit: {profit}, Average profit: {avg_profit}, Average bet: {avg_bet}, "
              f"Average bet (if Wonging): {avg_non_zero_bet}, Risk of ruin: {risk_of_ruin}")
    if plot_profits:
        plt.plot(profits_over_time_hand, label="Total profit")
        plt.xlabel("Hands played")
        plt.ylabel("Total profit")
        plt.title("Profits over time")
        plt.legend()
        plt.show()

    return profit, avg_profit, avg_bet, avg_non_zero_bet, risk_of_ruin


def _expected_value_multithreading_wrapper(results: multiprocessing.Queue[tuple[float, float, float, float, float]],
                                           action_class: action_strategies.BaseMover,
                                           betting_class: betting_strategies.BaseBetter,
                                           simulations: int, deck_number: int = 6, shoe_penetration: float = .25,
                                           dealer_peeks_for_blackjack: bool = True, das: bool = True,
                                           dealer_stands_soft_17: bool = True, surrender_allowed: bool = True,
                                           units: int = 200, hands_played: int = 1000) -> None:
    """
    Estimate the expected value of a strategy. Used inside multithreading. Don't use this function directly.

    :param action_class: The class that chooses the action.
    :param betting_class: The class that chooses the bet.
    :param simulations: How many hands to play.
    :param deck_number: The number of decks in the initial shoe.
    :param shoe_penetration: When to reshuffle the shoe. Reshuffles when cards remaining < starting cards * deck penetration.
    :param dealer_peeks_for_blackjack: Whether the dealer peeks for blackjack.
    :param das: Whether we can double after splitting.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :param surrender_allowed: Whether the game rules allow surrendering.
    :param units: The number of units in total.
    :param hands_played: How many hands to play before checking the risk of ruin.
    """
    results.put(expected_value(action_class, betting_class, simulations, deck_number, shoe_penetration,
                               dealer_peeks_for_blackjack, das, dealer_stands_soft_17, surrender_allowed,
                               units, hands_played, False, False))


def expected_value_multithreading(action_class: action_strategies.BaseMover, betting_class: betting_strategies.BaseBetter,
                                  total_simulations: int, cores: int = 2, deck_number: int = 6, shoe_penetration: float = .25,
                                  dealer_peeks_for_blackjack: bool = True, das: bool = True,
                                  dealer_stands_soft_17: bool = True, surrender_allowed: bool = True,
                                  units: int = 200, hands_played: int = 1000) -> tuple[float, float, float, float]:
    """
    Estimate the expected value of a strategy, using multithreading to speed up the process. Can't plot the results.

    :param action_class: The class that chooses the action.
    :param betting_class: The class that chooses the bet.
    :param total_simulations: How many hands to play in total.
    :param cores: How many cores to use for the simulation.
    :param deck_number: The number of decks in the initial shoe.
    :param shoe_penetration: When to reshuffle the shoe. Reshuffles when cards remaining < starting cards * deck penetration.
    :param dealer_peeks_for_blackjack: Whether the dealer peeks for blackjack.
    :param das: Whether we can double after splitting.
    :param dealer_stands_soft_17: Whether the dealer stands on soft 17.
    :param surrender_allowed: Whether the game rules allow surrendering.
    :param units: The number of units in total.
    :param hands_played: How many hands to play before checking the risk of ruin.
    :return: The total return, the average return of a game, the average bet size, and the risk of ruin.
    """
    core_results: multiprocessing.Queue[tuple[float, float, float, float, float]] = multiprocessing.Queue()
    worker_pool = []
    for _ in range(cores):
        p = multiprocessing.Process(target=_expected_value_multithreading_wrapper,
                                    args=(core_results, action_class, betting_class, total_simulations // cores,
                                          deck_number, shoe_penetration, dealer_peeks_for_blackjack, das,
                                          dealer_stands_soft_17, surrender_allowed, units, hands_played))
        p.start()
        worker_pool.append(p)
    for p in worker_pool:
        p.join()  # Wait for all the workers to finish.
    profit = 0.
    avg_profit = 0.
    avg_bet = 0.
    avg_non_zero_bet = 0.
    avg_risk_of_ruin = 0.
    for _ in range(cores):
        profit_core, avg_profit_core, avg_bet_core, avg_non_zero_bet_core, risk_of_ruin = core_results.get()
        profit += profit_core
        avg_profit += avg_profit_core
        avg_bet += avg_bet_core
        avg_non_zero_bet += avg_non_zero_bet_core
        avg_risk_of_ruin += risk_of_ruin
    avg_bet /= cores
    avg_non_zero_bet /= cores
    avg_profit /= cores
    avg_risk_of_ruin /= cores
    print(f"Total profit: {profit}, Average profit: {avg_profit}, Average bet: {avg_bet}, "
          f"Average bet (if Wonging): {avg_non_zero_bet}, Risk of ruin: {avg_risk_of_ruin}")
    return profit, avg_profit, avg_bet, avg_risk_of_ruin


if __name__ == "__main__":
    parser = argparse.ArgumentParser(prog='Expected Value (EV) Calculation',
                                     description='Evaluate the profitability of different blackjack strategies by calculating'
                                                 ' their expected value (EV).')
    parser.add_argument("-c", "--custom", action='store_true',
                        help='Run custom user-defined movers and betters that require special initialization.')
    parser.add_argument("--cores", default=1, type=int,
                        help='How many cores to use in the calculation. (default: 1, use -1 for all cores)')
    parser.add_argument("-m", "--mover", default="card-count",
                        help='Use a predefined mover. Can also be the name of the class of a user-defined mover. '
                             '(possible values: card-count, basic-strategy-deviations, basic-strategy, perfect, simple; '
                             'default: card-count)')
    parser.add_argument("-b", "--better", default="card-count",
                        help='Use a predefined better. Can also be the name of the class of a user-defined better. '
                             '(possible values: card-count, conservative-card-count, wonging-card-count, '
                             'wonging-conservative-card-count, simple; default: card-count)')
    parser.add_argument("-s", "--simulations", default=100_000, type=int,
                        help='How many simulations to run. Running more simulations gives more accurate '
                             'results but they are slower to calculate. (default: 100,000)')
    parser.add_argument("--decks", default=6, type=int, help='How many decks the shoe starts with. (default: 6)')
    parser.add_argument("--deck-penetration", default=.25, type=float,
                        help='When to reshuffle the shoe. Reshuffles when cards remaining < starting cards'
                             ' * deck penetration. (default: 0.25)')
    parser.add_argument("--stand17", action='store_true', help='Dealer should stand on soft 17. (default: true)')
    parser.add_argument("--hit17", action='store_true', help='Dealer should hit on soft 17. (default: false)')
    parser.add_argument("--das", action='store_true', help='Allow double after split. (default: true)')
    parser.add_argument("--no-das", action='store_true', help='Don\'t allow double after split. (default: false)')
    parser.add_argument("--peek", action='store_true', help='Dealer peeks for blackjack. (default: true)')
    parser.add_argument("--no-peek", action='store_true', help="Dealer doesn't peek for blackjack. (default: false)")
    parser.add_argument("--surrender", action='store_true', help='Allow surrendering. (default: true)')
    parser.add_argument("--no-surrender", action='store_true', help='Don\'t allow surrendering. (default: false)')
    parser.add_argument("--units", default=200, type=int, help='The number of units in total. (default: 200)')
    parser.add_argument("--hands-played", default=1000, type=int,
                        help='How many hands to play before checking the risk of ruin. (default: 1000)')
    args = parser.parse_args()

    decks_number = args.decks
    stand_soft_17 = args.stand17 or (not args.hit17)
    das_allowed = args.das or (not args.no_das)
    peek_for_bj = args.peek or (not args.no_peek)
    can_surrender = args.surrender or (not args.no_surrender)

    cores_used = args.cores if args.cores != -1 else multiprocessing.cpu_count()

    if args.custom:
        # ADD CUSTOM CODE HERE IF YOU HAVE BUILT YOUR OWN MOVER OR BETTER.
        mover = BaseMover()  # Replace BaseMover with your own class.
        better = BaseBetter()  # Replace BaseBetter with your own class.
    else:
        mover, better = get_mover_and_better(args.mover, args.better)

    if cores_used > 1:
        expected_value_multithreading(mover, better, args.simulations, cores_used, args.decks, args.deck_penetration,
                                      peek_for_bj, das_allowed, stand_soft_17, can_surrender, args.units, args.hands_played)
    else:
        expected_value(mover, better, args.simulations, args.decks, args.deck_penetration, peek_for_bj, das_allowed,
                       stand_soft_17, can_surrender, args.units, args.hands_played)