Added the HttpClient config options into the config file

nemethviktor · nemethviktor · commit 93428c7a0eeb · 2024-03-16T09:52:38.000Z
diff --git a/FrmMainApp.cs b/FrmMainApp.cs
@@ -32,32 +32,45 @@ public partial class FrmMainApp : Form
     internal static IEnumerable<ETFType>? ETF_Types;
 
     private Configuration _config;
-    private KeyValueConfigurationCollection _section = new();
+    private readonly KeyValueConfigurationCollection _settingsSection = new();
     private CancellationTokenSource cancellationTokenSource;
 
     private static HttpClient _httpClient = new();
 
     public FrmMainApp()
     {
         cancellationTokenSource = new CancellationTokenSource();
+        _config = ConfigurationManager.OpenExeConfiguration(userLevel: ConfigurationUserLevel.None);
+        _settingsSection = _config.AppSettings.Settings;
 
         InitializeComponent();
         GetETFTypesFromCSV();
 
+        double pooledConnectionLifetimeSetting = _settingsSection.AllKeys.Contains(value: "PooledConnectionLifetime")
+            ? Convert.ToDouble(value: _settingsSection[key: "PooledConnectionLifetime"].Value)
+            : 2;
+        double pooledConnectionIdleTimeoutSetting =
+            _settingsSection.AllKeys.Contains(value: "PooledConnectionIdleTimeout")
+                ? Convert.ToDouble(value: _settingsSection[key: "PooledConnectionIdleTimeout"].Value)
+                : 1;
+        int maxConnectionsPerServerSetting = _settingsSection.AllKeys.Contains(value: "MaxConnectionsPerServer")
+            ? Convert.ToInt32(value: _settingsSection[key: "MaxConnectionsPerServer"].Value)
+            : 100;
+
+
         SocketsHttpHandler socketsHandler = new()
         {
-            PooledConnectionLifetime = TimeSpan.FromMinutes(value: 2),
-            MaxConnectionsPerServer = 100
+            PooledConnectionLifetime = TimeSpan.FromMinutes(value: pooledConnectionLifetimeSetting),
+            PooledConnectionIdleTimeout = TimeSpan.FromMinutes(value: pooledConnectionIdleTimeoutSetting),
+            MaxConnectionsPerServer = maxConnectionsPerServerSetting
         };
 
         _httpClient = new HttpClient(handler: socketsHandler);
     }
 
     private void FrmMainApp_Load(object sender, EventArgs e)
     {
-        _config = ConfigurationManager.OpenExeConfiguration(userLevel: ConfigurationUserLevel.None);
-        _section = _config.AppSettings.Settings;
-        if (_section[key: "Theme"].Value == "Dark") tsmi_DarkishMode.PerformClick();
+        if (_settingsSection[key: "Theme"].Value == "Dark") tsmi_DarkishMode.PerformClick();
 
         btn_StartScrape.Enabled = true;
         btn_Stop.Enabled = false;
@@ -707,7 +720,7 @@ private void tsmi_DarkishMode_Click(object sender, EventArgs e)
         HelperVariables.UserSettingUseDarkMode = tsmi_DarkishMode.Checked;
         SetAppTheme();
 
-        _section[key: "Theme"].Value = HelperVariables.UserSettingUseDarkMode ? "Dark" : "Light";
+        _settingsSection[key: "Theme"].Value = HelperVariables.UserSettingUseDarkMode ? "Dark" : "Light";
 
         _config.Save(saveMode: ConfigurationSaveMode.Modified);
         ConfigurationManager.RefreshSection(sectionName: _config.AppSettings.SectionInformation.Name);
diff --git a/app.config b/app.config
@@ -2,5 +2,8 @@
 <configuration>
   <appSettings>
     <add key="Theme" value="Light"/>
+	<add key="PooledConnectionLifetime" value="2"/>
+	<add key="PooledConnectionIdleTimeout" value="1"/>
+	<add key="MaxConnectionsPerServer" value="100"/>
   </appSettings>
 </configuration>
diff --git a/changelog.md b/changelog.md
@@ -3,6 +3,7 @@
 **Build 88xx [202403xx]**
 - NEW & UPDATED:
   - I've rewritten the HttpClient handling. Should have read up on the documentation beforehand - no more loops!
+  - Added the HttpClient config options into the config file, though I strongly suggest not changing them.
   
 - BUGS & FIXES:
   - N/A
diff --git a/readme.md b/readme.md
@@ -40,8 +40,8 @@ On that note the app can only collect stuff that's either visibly available on t
 
 ### Performance
 
-- The whole data pull is around 4.5GB but it appears to be capped on the server side somewhere around 15-20MB/sec (that's around 200 megabits/sec).
-- The whole end-to-end process (assuming favourable conditions) takes around 10-15 mins.
+- The data pull is around 4.5GB (approx. 22,800 pages at the time of initial publication), but the transfer rate appears to be capped on the server side at somewhere around 15-20MB/sec (that's roughly 120-160 megabits/sec).
+- The end-to-end process (assuming favourable conditions) takes around 10-15 mins.
 - The app uses a library (`CompressedMemoryCache.cs`) built by Gustavo Augusto Hennig; its licence (Apache 2.0) is contained in the file.
     - It's necessary to use compression on the html pages because storing that many (read: tens of thousands) pages at 200-400kbytes each will eat up memory in no time. My initial tests of letters A-C made the app consume around 5GB RAM w/o compression and sub-1GB w/ compression.
 - I did some testing on what I deem a 'normal' performance laptop, i.e. a Ryzen 7 PRO 5850U [8x 4370 MHz] w/ 32 GB RAM - the Release (i.e. non-Debug) version of the app peaked at 25% CPU and (again) just under 1GB RAM.
@@ -87,7 +87,9 @@ I'm generally happy for anyone competent to add pull requests but I don't always
 
 ## Known Issues
 
-- "Ticker" extraction works on the basis of getting whatever's in the last parentheses of the header. This is because HL website doesn't appear to store this info separately. In some rare cases (espc w/ Trusts) this can yield odd results. (e.g. [here](https://www.hl.co.uk/shares/shares-search-results/b/baillie-gifford-us-growth-trust-ord) we'd pick up "USA", which is wrong.)
+- "Ticker" extraction works on the basis of getting whatever's in the last parentheses of the header. This is because the HL website doesn't appear to store this info separately. In some rare cases (especially with Trusts) this can yield odd results, e.g.:
+    - [here](https://www.hl.co.uk/shares/shares-search-results/b/baillie-gifford-us-growth-trust-ord) we'd pick up "USA", which I'm not sure about, whereas
+    - [this one](https://www.hl.co.uk/shares/shares-search-results/a/argentina-1-bds-090729-usd1) gets entirely discarded because there's no ticker.
 - The "Sector" classification can occasionally mislabel securities as ETFs, particularly when their name contains the word "Fund" or "Income". HL doesn't actually have an ETF flag, so the code attempts to decipher what's what. This works in around 98% of cases.
 
 ## When reporting bugs please specify