diff --git a/timm/models/regnet.py b/timm/models/regnet.py
index 93e31bd8..e6d0e646 100644
--- a/timm/models/regnet.py
+++ b/timm/models/regnet.py
@@ -143,8 +143,8 @@ default_cfgs = dict(
     regnety_320=_cfg(url='https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-regnet/regnety_320-ba464b29.pth'),
 
     regnety_040s_gn=_cfg(url=''),
-    regnetv_040=_cfg(url=''),
-    regnetw_040=_cfg(url=''),
+    regnetv_040=_cfg(url='', first_conv='stem'),
+    regnetw_040=_cfg(url='', first_conv='stem', input_size=(3, 256, 256), pool_size=(8, 8)),
 
     regnetz_005=_cfg(url=''),
     regnetz_040=_cfg(url='', input_size=(3, 256, 256), pool_size=(8, 8)),
@@ -165,16 +165,19 @@ def adjust_widths_groups_comp(widths, bottle_ratios, groups):
     return widths, groups
 
 
-def generate_regnet(width_slope, width_initial, width_mult, depth, q=8):
+def generate_regnet(width_slope, width_initial, width_mult, depth, group_size, q=8):
     """Generates per block widths from RegNet parameters."""
     assert width_slope >= 0 and width_initial > 0 and width_mult > 1 and width_initial % q == 0
+    # TODO dWr scaling?
+    # depth = int(depth * (scale ** 0.1))
+    # width_scale = scale ** 0.4  # dWr scale, exp 0.8 / 2, applied to both group and layer widths
     widths_cont = np.arange(depth) * width_slope + width_initial
     width_exps = np.round(np.log(widths_cont / width_initial) / np.log(width_mult))
     widths = width_initial * np.power(width_mult, width_exps)
     widths = np.round(np.divide(widths, q)) * q
     num_stages, max_stage = len(np.unique(widths)), width_exps.max() + 1
-    widths, widths_cont = widths.astype(int).tolist(), widths_cont.tolist()
-    return widths, num_stages, max_stage, widths_cont
+    groups = np.array([group_size for _ in range(num_stages)])
+    return widths.astype(int).tolist(), num_stages, groups.astype(int).tolist()
 
 
 def downsample_conv(in_chs, out_chs, kernel_size=1, stride=1, dilation=1, norm_layer=None, preact=False):
@@ -395,14 +398,11 @@ class RegNet(nn.Module):
 
     def _get_stage_args(self, cfg: RegNetCfg, default_stride=2, output_stride=32, drop_path_rate=0.):
         # Generate RegNet ws per block
-        widths, num_stages, _, _ = generate_regnet(cfg.wa, cfg.w0, cfg.wm, cfg.depth)
+        widths, num_stages, stage_gs = generate_regnet(cfg.wa, cfg.w0, cfg.wm, cfg.depth, cfg.group_size)
 
         # Convert to per stage format
         stage_widths, stage_depths = np.unique(widths, return_counts=True)
-
-        # Use the same group width, bottleneck mult and stride for each stage
-        stage_groups = [cfg.group_size for _ in range(num_stages)]
-        stage_bottle_ratios = [cfg.bottle_ratio for _ in range(num_stages)]
+        stage_br = [cfg.bottle_ratio for _ in range(num_stages)]
         stage_strides = []
         stage_dilations = []
         net_stride = 2
@@ -416,15 +416,14 @@ class RegNet(nn.Module):
                 net_stride *= stride
             stage_strides.append(stride)
             stage_dilations.append(dilation)
-        stage_dpr = np.split(np.linspace(0, drop_path_rate, cfg.depth), np.cumsum(stage_depths[:-1]))
+        stage_dpr = np.split(np.linspace(0, drop_path_rate, sum(stage_depths)), np.cumsum(stage_depths[:-1]))
 
         # Adjust the compatibility of ws and gws
-        stage_widths, stage_groups = adjust_widths_groups_comp(stage_widths, stage_bottle_ratios, stage_groups)
+        stage_widths, stage_gs = adjust_widths_groups_comp(stage_widths, stage_br, stage_gs)
         arg_names = ['out_chs', 'stride', 'dilation', 'depth', 'bottle_ratio', 'group_size', 'drop_path_rates']
         per_stage_args = [
             dict(zip(arg_names, params)) for params in
-            zip(stage_widths, stage_strides, stage_dilations, stage_depths, stage_bottle_ratios, stage_groups,
-                stage_dpr)]
+            zip(stage_widths, stage_strides, stage_dilations, stage_depths, stage_br, stage_gs, stage_dpr)]
         common_args = dict(
             downsample=cfg.downsample, se_ratio=cfg.se_ratio, linear_out=cfg.linear_out,
             act_layer=cfg.act_layer, norm_layer=cfg.norm_layer)