Implement methods for finding representative period weights (#10)

TulipaEnergy · Dec 5, 2023 · 6a21c7f · 6a21c7f
1 parent 5c5e7d9
commit 6a21c7f
Show file tree

Hide file tree

Showing 8 changed files with 393 additions and 149 deletions.
diff --git a/src/TulipaClustering.jl b/src/TulipaClustering.jl
@@ -10,6 +10,7 @@ using SparseArrays
 include("input-tables.jl")
 include("structures.jl")
 include("io.jl")
+include("weight_fitting.jl")
 include("cluster.jl")
 
 end
diff --git a/src/cluster.jl b/src/cluster.jl
@@ -538,11 +538,6 @@ function find_representative_periods(
     throw(ArgumentError("Clustering method is not supported"))
   end
 
-  # If demands was rescaled, scale it back
-  if rescale_demand_data
-    rp_matrix[1:n_demand_rows, :] .*= demand_scaling_factor
-  end
-
   # Fill in the weight matrix using the assignments
   for (p, rp) ∈ enumerate(assignments)
     weight_matrix[p, rp] = complete_period_weight
@@ -552,6 +547,11 @@ function find_representative_periods(
 
   # First, convert the matrix data back to dataframes using the previously saved key columns
   demand_rp_df = matrix_and_keys_to_df(rp_matrix[1:n_demand_rows, :], demand_keys)
+  # If demands was rescaled, scale it back
+  if rescale_demand_data
+    demand_rp_df.value .*= demand_scaling_factor
+  end
+
   generation_availability_rp_df =
     matrix_and_keys_to_df(rp_matrix[(n_demand_rows + 1):end, :], generation_availability_keys)
 
@@ -574,5 +574,11 @@ function find_representative_periods(
     )
   end
 
-  return ClusteringResult(demand_rp_df, generation_availability_rp_df, weight_matrix)
+  return ClusteringResult(
+    demand_rp_df,
+    generation_availability_rp_df,
+    weight_matrix,
+    clustering_matrix,
+    rp_matrix,
+  )
 end
diff --git a/src/structures.jl b/src/structures.jl
@@ -46,9 +46,17 @@ Structure to hold the clustering result.
 mutable struct ClusteringResult
   demand::AbstractDataFrame
   generation_availability::AbstractDataFrame
-  weight_matrix::Matrix{Float64}
+  weight_matrix::Union{SparseMatrixCSC{Float64, Int64}, Matrix{Float64}}
+  clustering_matrix::Matrix{Float64}
+  rp_matrix::Matrix{Float64}
 
-  function ClusteringResult(demand, generation_availability, weight_matrix)
-    return new(demand, generation_availability, weight_matrix)
+  function ClusteringResult(
+    demand,
+    generation_availability,
+    weight_matrix,
+    clustering_matrix,
+    rp_matrix,
+  )
+    return new(demand, generation_availability, weight_matrix, clustering_matrix, rp_matrix)
   end
 end
diff --git a/src/weight_fitting.jl b/src/weight_fitting.jl
@@ -0,0 +1,251 @@
+export fit_rep_period_weights!
+
+"""
+  project_onto_simplex(vector)
+
+Projects `vector` onto a unit simplex using Michelot's algorithm in
+Condat's accelerated implementation (2017). See Figure 2 of
+[Condat, L. _Fast projection onto the simplex and the  ball._ Math. Program. 158,
+575–585 (2016).](https://doi.org/10.1007/s10107-015-0946-6). For the details on
+the meanings of v, ṽ, ρ and other variables, see the original paper.
+"""
+function project_onto_simplex(vector::Vector{Float64})
+  # There is a trivial solution when it's a one-element vector
+  if length(vector) == 1
+    return [1.0]
+  end
+  # step 1
+  v = [vector[1]]
+  ṽ = Vector{Float64}()
+  ρ = vector[1] - 1.0
+  # step 2
+  for y ∈ vector[2:end]
+    if y > ρ
+      ρ += (y - ρ) / (length(v) + 1)
+      if ρ > y - 1.0
+        push!(v, y)
+      else
+        append!(ṽ, v)
+        v = [y]
+        ρ = y - 1.0
+      end
+    end
+  end
+  # step 3
+  for y ∈ ṽ
+    if y > ρ
+      push!(v, y)
+      ρ += (y - ρ) / length(v)
+    end
+  end
+  # step 4
+  while true
+    length_v = length(v)
+    to_be_removed = Vector{Int}()
+    for (i, y) ∈ enumerate(v)
+      if y ≤ ρ
+        push!(to_be_removed, i)
+        length_v -= 1
+        ρ += (ρ - y) / length_v
+      end
+    end
+    if length(to_be_removed) == 0
+      break
+    end
+    deleteat!(v, to_be_removed)
+  end
+  # step 5 is skipped because it computes the data that we do not need
+  # step 6
+  return max.(vector .- ρ, 0.0)
+end
+
+"""
+  project_onto_nonnegative_orthant(vector)
+
+Projects `vector` onto the nonnegative_orthant. This projection is trivial:
+replace negative components of the vector with zeros.
+"""
+function project_onto_nonnegative_orthant(vector::Vector{Float64})
+  return max.(vector, 0.0)
+end
+
+"""
+  projected_subgradient_descent!(x; gradient, projection, niters, rtol, learning_rate, adaptive_grad)
+
+Fits `x` using the projected gradient descent scheme.
+
+The arguments:
+
+  - `x`: the value to fit
+  - `subgradient`: the subgradient operator, that is, a function that takes
+    vectors of the same shape as `x` as inputs and returns a subgradient of the
+    loss at that point; the fitting is done to minimize the corresponding
+    implicit loss
+  - `projection`: the projection operator, that is, a function that, given a
+    vector `x`, finds a point within some subspace that is closest to `x`
+  - `niters`: maximum number of projected gradient descent iterations
+  - `tol`: tolerance; when no components of `x` improve by more than `tol`, the
+    algorithm stops
+  - `learning_rate`: learning rate of the algorithm
+  - `adaptive_grad`: if true, the learning rate is adjusted using the adaptive
+    gradient method, see [John Duchi, Elad Hazan, and Yoram Singer. 2011.
+    _Adaptive Subgradient Methods for Online Learning and Stochastic
+      Optimization._ J. Mach. Learn. Res. 12, null (2/1/2011), 2121–2159.]
+      (https://dl.acm.org/doi/10.5555/1953048.2021068)
+"""
+function projected_subgradient_descent!(
+  x::Vector{Float64};
+  subgradient::Function,
+  projection::Function,
+  niters::Int = 100,
+  tol::Float64 = 1e-3,
+  learning_rate::Float64 = 0.001,
+  adaptive_grad = true,
+)
+  # It is possible that the initial guess is not in the required subspace;
+  # project it first.
+  x = projection(x)
+
+  if adaptive_grad
+    G = zeros(length(x))
+  end
+
+  for _ ∈ 1:niters
+    g = subgradient(x)  # find the subgradient
+    if adaptive_grad    # find the learning rate
+      G += g .^ 2
+      α = learning_rate ./ (1e-6 .+ .√(G))
+    else
+      α = learning_rate
+    end
+    y = x .- α .* g            # gradent step, may leave the domain
+    x_new = projection(y)      # projection step, return to the domain
+    diff = maximum(x_new - x)  # how much did the vector change
+    x = x_new
+    if diff ≤ tol
+      break
+    end
+  end
+  return x
+end
+
+"""
+  fit_rep_period_weights!(weight_matrix, clustering_matrix, rp_matrix; weight_type, tol, args...)
+
+Given the initial weight guesses, finds better weights for convex or conical
+combinations of representative periods. For conical weights, it is possible to
+bound the total weight by one.
+
+The arguments:
+
+  - `weight_matrix`: the initial guess for weights; the weights are adjusted
+    using a projected subgradient descent method
+  - `clustering_matrix`: the matrix of raw clustering data
+  - `rp_matrix`: the matrix of raw representative period data
+  - `weight_type`: the type of weights to find; possible values are:
+      - `:convex`: each period is represented as a convex sum of the
+        representative periods (a sum with nonnegative weights adding into one)
+      - `:conical`: each period is represented as a conical sum of the
+        representative periods (a sum with nonnegative weights)
+      - `:conical_bounded`: each period is represented as a conical sum of the
+        representative periods (a sum with nonnegative weights) with the total
+        weight bounded from above by one.
+  - `tol`: algorithm's tolerance; when the weights are adjusted by a value less
+    then or equal to `tol`, they stop being fitted further.
+  - other arguments control the projected subgradient method; they are passed
+    through to `TulipaClustering.projected_subgradient_descent!`.
+"""
+function fit_rep_period_weights!(
+  weight_matrix::Union{SparseMatrixCSC{Float64, Int64}, Matrix{Float64}},
+  clustering_matrix::Matrix{Float64},
+  rp_matrix::Matrix{Float64};
+  weight_type::Symbol = :dirac,
+  tol::Float64 = 10e-3,
+  args...,
+)
+  # Determine the appropriate projection method
+  if weight_type == :convex
+    projection = project_onto_simplex
+  elseif weight_type == :conical
+    projection = project_onto_nonnegative_orthant
+  elseif weight_type == :conical_bounded
+    # Conic bounded method does convex fitting, but adds a zero component.
+    # The weight of a zero vector is then discarded without affecting the
+    # total, and the resulting weights will always have sums between zero and
+    # one.
+    projection = project_onto_simplex
+    n_data_points = size(rp_matrix, 1)
+    rp_matrix = hcat(rp_matrix, repeat([0.0], n_data_points))
+  else
+    throw(ArgumentError("Unsupported weight type."))
+  end
+
+  n_periods = size(clustering_matrix, 2)
+  n_rp = size(rp_matrix, 2)
+
+  for period ∈ 1:n_periods  # TODO: this can be parallelized; investigate
+    target_vector = clustering_matrix[:, period]
+    x = Vector(weight_matrix[period, 1:n_rp])
+    if weight_type == :conical_bounded
+      x[n_rp] = 0.0
+    end
+    x = projected_subgradient_descent!(
+      x;
+      subgradient = (x) -> rp_matrix' * (rp_matrix * x - target_vector),
+      projection,
+      tol = tol,
+      args...,
+    )
+    x[x .< tol] .= 0.0  # replace insifnificant small values with zeros
+    if weight_type == :convex
+      # Because some values might have been removed, convexity can be lost.
+      # To account for these, the weights are re-normalized.
+      x = x ./ sum(x)
+    end
+    if weight_type == :conical_bounded
+      pop!(x)
+    end
+    weight_matrix[period, 1:length(x)] = x
+  end
+  return weight_matrix
+end
+
+"""
+  fit_rep_period_weights!(weight_matrix, clustering_matrix, rp_matrix; weight_type, tol, args...)
+
+  Given the initial weight guesses, finds better weights for convex or conical
+combinations of representative periods. For conical weights, it is possible to
+bound the total weight by one.
+
+The arguments:
+
+  - `clustering_result`: the result of running
+    `TulipaClustering.find_representative_periods`
+  - `weight_type`: the type of weights to find; possible values are:
+      - `:convex`: each period is represented as a convex sum of the
+        representative periods (a sum with nonnegative weights adding into one)
+      - `:conical`: each period is represented as a conical sum of the
+        representative periods (a sum with nonnegative weights)
+      - `:conical_bounded`: each period is represented as a conical sum of the
+        representative periods (a sum with nonnegative weights) with the total
+        weight bounded from above by one.
+  - `tol`: algorithm's tolerance; when the weights are adjusted by a value less
+    then or equal to `tol`, they stop being fitted further.
+  - other arguments control the projected subgradient method; they are passed
+    through to `TulipaClustering.projected_subgradient_descent!`.
+"""
+function fit_rep_period_weights!(
+  clustering_result = ClusteringResult;
+  weight_type::Symbol = :dirac,
+  tol::Float64 = 10e-3,
+  args...,
+)
+  fit_rep_period_weights!(
+    clustering_result.weight_matrix,
+    clustering_result.clustering_matrix,
+    clustering_result.rp_matrix;
+    weight_type,
+    tol,
+    args...,
+  )
+end