> ## Documentation Index
> Fetch the complete documentation index at: https://developer.upsun.com/llms.txt
> Use this file to discover all available pages before exploring further.

# Auto-scaling on Upsun Flex. A deep dive.

> Learn how Upsun's autoscaling dynamically adjusts application instances based on CPU usage, ensuring performance during traffic spikes while optimizing costs.

export const PostMeta = ({data = {}}) => {
  const {author, date} = data;
  const authors = Array.isArray(author) ? author : author ? [author] : [];
  const toSlug = value => String(value).toLowerCase().trim().replace(/\s+/g, '-').replace(/[^a-z0-9-]/g, '');
  const resolveAuthor = slug => {
    const entry = AUTHOR_MAP[slug] || ({});
    const name = entry.name || slug;
    const github = entry.github || null;
    const url = `/posts/authors/${toSlug(slug)}`;
    const avatarUrl = github ? `https://github.com/${github}.png?size=64` : null;
    return {
      name,
      url,
      avatarUrl
    };
  };
  const formattedDate = date ? new Date(date).toLocaleDateString('en-US', {
    year: 'numeric',
    month: 'long',
    day: 'numeric'
  }) : null;
  if (authors.length === 0 && !formattedDate) return null;
  const AUTHOR_MAP = {
    "aaron-collier": {
      "name": "Aaron Collier"
    },
    "aaron-dudenhofer": {
      "name": "Aaron Dudenhofer"
    },
    "aaron-porter": {
      "name": "Aaron Porter"
    },
    "adriaan-odendaal": {
      "name": "Adriaan Odendaal"
    },
    "ajmal": {
      "name": "Ajmal Siddiqui"
    },
    "akalipetis": {
      "name": "Antonis Kalipetis"
    },
    "alexander-varwijk": {
      "name": "Alexander Varwijk"
    },
    "alicia-bevilacqua": {
      "name": "Alicia Bevilacqua"
    },
    "amelie-deguerry": {
      "name": "Amelie Deguerry"
    },
    "anacidre": {
      "name": "Ana Cidre",
      "linkedin": "https://www.linkedin.com/in/ana-cidre"
    },
    "andoni": {
      "name": "Andoni Auzmendi"
    },
    "andrei-taranu": {
      "name": "Andrei (Alex) Taranu",
      "linkedin": "https://www.linkedin.com/in/andrei-alex-taranu/"
    },
    "andrew-baxter": {
      "name": "Andrew Baxter"
    },
    "andrew-melck": {
      "name": "Andrew Melck"
    },
    "antoine-crochet-damais": {
      "name": "Antoine Crochet Damais"
    },
    "augustin-delaporte": {
      "name": "Augustin Delaporte",
      "linkedin": "https://www.linkedin.com/in/augustindelaporte/"
    },
    "branislav-bujisic": {
      "name": "Branislav Bujisic"
    },
    "carl-smith": {
      "name": "Carl Smith"
    },
    "caroline-leroy": {
      "name": "Caroline Leroy"
    },
    "cati-mayer": {
      "name": "Cati Mayer"
    },
    "catplat": {
      "name": "C Trinkwon"
    },
    "ceelolulu": {
      "name": "Celeste van der Watt"
    },
    "chadwcarlson": {
      "name": "Chad Carlson",
      "github": "chadwcarlson",
      "linkedin": "https://www.linkedin.com/in/chadwcarlson"
    },
    "chris-ward": {
      "name": "Chris Ward"
    },
    "chris-yates": {
      "name": "Chris Yates"
    },
    "christian-sieber": {
      "name": "Christian Sieber"
    },
    "christopher-lockheardt": {
      "name": "Christopher Lockheardt"
    },
    "christopher-skene": {
      "name": "Christopher Skene"
    },
    "chuck-morgan": {
      "name": "Chuck Morgan"
    },
    "corey-dockendorf": {
      "name": "Corey Dockendorf"
    },
    "crell": {
      "name": "Crell"
    },
    "damz": {
      "name": "Damz"
    },
    "dan-morrison": {
      "name": "Dan Morrison"
    },
    "davidbonachera": {
      "name": "David Bonachera",
      "github": "davidbonachera",
      "linkedin": "https://www.linkedin.com/in/davidbonachera"
    },
    "dereliahmet1": {
      "name": "Ahmet Faruk Dereli"
    },
    "devicezero": {
      "name": "Jonas Kröger",
      "github": "devicezero",
      "linkedin": "https://www.linkedin.com/in/jonaskroeger/"
    },
    "doug-goldberg": {
      "name": "Doug Goldberg"
    },
    "duncan-naves": {
      "name": "Duncan Naves",
      "github": "duncannaves",
      "linkedin": "https://www.linkedin.com/in/duncan-naves-a94423aa"
    },
    "erika-bustamante": {
      "name": "Erika Bustamante"
    },
    "fabpot": {
      "name": "Fabien Potencier"
    },
    "flovntp": {
      "name": "Florent Huck",
      "github": "flovntp",
      "linkedin": "https://www.linkedin.com/in/florenthuck"
    },
    "fred-plais": {
      "name": "Fred Plais"
    },
    "gauthier-garnier": {
      "name": "Gauthier Garnier"
    },
    "gilzow": {
      "name": "Paul Gilzow"
    },
    "gmoigneu": {
      "name": "Guillaume Moigneu",
      "github": "gmoigneu",
      "linkedin": "https://www.linkedin.com/in/guillaumemoigneu/"
    },
    "gregqualls": {
      "name": "Greg Qualls"
    },
    "guguss": {
      "name": "Augustin Delaporte"
    },
    "haylee-millar": {
      "name": "Haylee Millar"
    },
    "ivana-kotur": {
      "name": "Ivana Kotur"
    },
    "jackrabbithanna": {
      "name": "Mark Hanna",
      "github": "jackrabbithanna"
    },
    "jared-wright": {
      "name": "Jared Wright",
      "github": "jww-sh",
      "linkedin": "https://www.linkedin.com/in/jaredwaynewright"
    },
    "jessica-orozco": {
      "name": "Jessica Orozco"
    },
    "joey-stanford": {
      "name": "Joey Stanford"
    },
    "john-grubb": {
      "name": "John Grubb"
    },
    "jonas-kruger": {
      "name": "Jonas Kruger"
    },
    "kathryn-frazer": {
      "name": "Kathryn Frazer"
    },
    "kemiojo": {
      "name": "Kemi Elizabeth Ojogbede"
    },
    "kieronsambrook-smith": {
      "name": "Kieronsambrook Smith"
    },
    "laurent-arnoud": {
      "name": "Laurent Arnoud",
      "linkedin": "https://www.linkedin.com/in/laurent-arnoud-861b44121/"
    },
    "letoya-boyne": {
      "name": "Letoya Boyne"
    },
    "lolautruche": {
      "name": "Jérôme Vieilledent"
    },
    "lyly-lepinay": {
      "name": "Lyly Lepinay"
    },
    "manauwar-alam": {
      "name": "Manauwar Alam"
    },
    "marc-antoine-porri": {
      "name": "Marc Antoine Porri"
    },
    "maria-antinkaapo": {
      "name": "Maria Antinkaapo"
    },
    "maria-de-anton": {
      "name": "Maria De Anton"
    },
    "mark-dorison": {
      "name": "Mark Dorison"
    },
    "markus-hausammann": {
      "name": "Markus Hausammann"
    },
    "mary-thomas": {
      "name": "Mary Thomas"
    },
    "mathias-bolt-lesniak": {
      "name": "Mathias Bolt Lesniak"
    },
    "mathieu-strauch": {
      "name": "Mathieu Strauch"
    },
    "matthias-van-woensel": {
      "name": "Matthias Van Woensel",
      "linkedin": "https://www.linkedin.com/in/matthias-van-woensel-267a069"
    },
    "maz-mohammadi": {
      "name": "Maz Mohammadi"
    },
    "michael-sharp": {
      "name": "Michael Sharp"
    },
    "mupsi": {
      "name": "Marine Gandy"
    },
    "natalie-harper": {
      "name": "Natalie Harper"
    },
    "ngommenginger": {
      "name": "Nicolas Gommenginger",
      "linkedin": "https://www.linkedin.com/in/nicolas-gommenginger"
    },
    "nicholas-bennison": {
      "name": "Nicholas Bennison"
    },
    "nicholas-vahalik": {
      "name": "Nicholas Vahalik"
    },
    "nick-hardiman": {
      "name": "Nick Hardiman"
    },
    "nickanderegg": {
      "name": "Nickanderegg"
    },
    "nicolas-grekas": {
      "name": "Nicolas Grekas",
      "github": "nicolas-grekas",
      "linkedin": "https://www.linkedin.com/in/nicolasgrekas/"
    },
    "niti-malwade": {
      "name": "Niti Malwade"
    },
    "opensocialteam": {
      "name": "Opensocialteam"
    },
    "ori-pekelman": {
      "name": "Ori Pekelman"
    },
    "otavio-santana": {
      "name": "Otavio Santana"
    },
    "palwandi": {
      "name": "Pawan Alwandi",
      "github": "pawpy",
      "linkedin": "https://www.linkedin.com/in/pawanalwandi"
    },
    "patrick-boest": {
      "name": "Patrick Boest"
    },
    "patrick-dawkins": {
      "name": "Patrick Dawkins",
      "github": "pjcdawkins",
      "linkedin": "https://www.linkedin.com/in/patrickdawkins"
    },
    "patrick-klima": {
      "name": "Patrick Klima"
    },
    "pjcdawkins": {
      "name": "Pjcdawkins"
    },
    "prineet-kaurbhurji": {
      "name": "Prineet Kaurbhurji"
    },
    "quentin-sinig": {
      "name": "Quentin Sinig"
    },
    "ralt": {
      "name": "Florian Margaine",
      "github": "ralt",
      "linkedin": "https://www.linkedin.com/in/florian-margaine-43971136"
    },
    "ramanathanramakrishnamurthy": {
      "name": "Ramanathanramakrishnamurthy"
    },
    "remi-lejeune": {
      "name": "Rémi Lejeune"
    },
    "ribel": {
      "name": "Taras Kruts"
    },
    "robert-douglass": {
      "name": "Robert Douglass"
    },
    "rudy-weber": {
      "name": "Rudy Weber"
    },
    "ryan-hicks": {
      "name": "Ryan Hicks"
    },
    "sabri-helal": {
      "name": "Sabri Helal"
    },
    "savannah-bergeron": {
      "name": "Savannah Bergeron"
    },
    "shannon-vettes": {
      "name": "Shannon Vettes"
    },
    "shawn-ogasawara": {
      "name": "Shawn Ogasawara",
      "linkedin": "https://www.linkedin.com/in/shawn-ogasawara-83a9a0/"
    },
    "shawna-spoor": {
      "name": "Shawna Spoor"
    },
    "shedrack-akintayo": {
      "name": "Shedrack Akintayo"
    },
    "simon-ruggier": {
      "name": "Simon Ruggier"
    },
    "sophie-van-der-kindere": {
      "name": "Sophie Van Der Kindere"
    },
    "stefanos-thampis": {
      "name": "Stefanos Thampis"
    },
    "stephen-weinberg": {
      "name": "Stephen Weinberg"
    },
    "sukhman-virk": {
      "name": "Sukhman Virk"
    },
    "sumaira-nazir": {
      "name": "Sumaira Nazir"
    },
    "sumer": {
      "name": "Sümer Cip"
    },
    "syed-raza": {
      "name": "Syed Raza"
    },
    "tamara-bacchia": {
      "name": "Tamara Bacchia"
    },
    "tara-arnold": {
      "name": "Tara Arnold"
    },
    "theosakamg": {
      "name": "Mickael Gaillard",
      "github": "theosakamg"
    },
    "thomasdiluccio": {
      "name": "Thomas di Luccio"
    },
    "tim-anderson": {
      "name": "Tim Anderson"
    },
    "tom-helmer-hansen": {
      "name": "Tom Helmer Hansen"
    },
    "tylermills": {
      "name": "Tyler Mills"
    },
    "upsun": {
      "name": "Upsun"
    },
    "veronika-tolkachova": {
      "name": "Veronika Tolkachova",
      "linkedin": "https://www.linkedin.com/in/veronika-tolkachova-169167a2"
    },
    "vince-parker": {
      "name": "Vince Parker"
    },
    "vinnie-russo": {
      "name": "Vincenzo Russo"
    },
    "vrobert78": {
      "name": "Vincent Robert",
      "github": "vrobert78",
      "linkedin": "https://www.linkedin.com/in/vincent-robert-498a883"
    },
    "yuriy-babenko": {
      "name": "Yuriy Babenko"
    },
    "yuriy-gerasimov": {
      "name": "Yuriy Gerasimov"
    }
  };
  return <div className="post-meta">
      {(authors.length > 0 || formattedDate) && <div className="post-meta-info">
          {authors.length > 0 && <div className="post-meta-authors">
              {authors.map(slug => {
    const {name, url, avatarUrl} = resolveAuthor(slug);
    const inner = <>
                    {avatarUrl && <img src={avatarUrl} alt={name} className="post-meta-avatar" />}
                    <span className="post-meta-author-name">{name}</span>
                  </>;
    return url ? <a key={slug} href={url} className="post-meta-author">
                    {inner}
                  </a> : <span key={slug} className="post-meta-author">{inner}</span>;
  })}
            </div>}
          {authors.length > 0 && formattedDate && <span className="post-meta-separator" aria-hidden="true">·</span>}
          {formattedDate && <span className="post-meta-date">{formattedDate}</span>}
        </div>}
    </div>;
};

<PostMeta data={{ author: ["gmoigneu", "flovntp"], date: "2025-10-20T00:00:00+00:00", image: "/images/posts/how-it-works/autoscaling-deep-dive/autoscaling-deep-dive.webp" }} />

## Introduction

Traffic doesn't arrive on schedule. Your application might handle steady requests for hours, then face a sudden spike from a product launch, marketing campaign, or unexpected viral moment. Manual scaling requires you to predict these patterns and adjust resources ahead of time, often leading to over-provisioning during quiet periods or scrambling to add capacity during peak load.

Upsun's new [autoscaling feature](https://docs.upsun.com/manage-resources/autoscaling.html) removes this guesswork. Your applications automatically scale horizontally based on real-time CPU metrics, adding instances when demand increases and removing them when traffic subsides. This ensures consistent performance for your users while keeping infrastructure costs aligned with actual usage.

## How autoscaling works on Upsun

### The scaling mechanism

Autoscaling continuously monitors average CPU utilization across all running instances of your application. When you configure autoscaling, you define two critical [thresholds](https://docs.upsun.com/manage-resources/autoscaling.html#thresholds):

**Scale-up threshold**: When average CPU usage exceeds this level for your configured evaluation period, Upsun launches additional instances to distribute the load. The default threshold is 80% CPU for 5 minutes.

**Scale-down threshold**: When average CPU usage falls below this level for the evaluation period, Upsun removes unnecessary instances to reduce costs. The default threshold is 20% CPU for 5 minutes.

Between scaling actions, a cooldown window prevents rapid fluctuations. This waiting period (default: 5 minutes) ensures the system stabilizes before making another adjustment.

### Architecture considerations

Autoscaling applies specifically to application containers, including your [PHP](https://docs.upsun.com/languages/php.html), [Node.js](https://docs.upsun.com/languages/nodejs.html), [Python](https://docs.upsun.com/languages/python.html), or [other runtime](https://docs.upsun.com/languages.html) environments. Services like [MySQL](https://docs.upsun.com/add-services/mysql.html), [PostgreSQL](https://docs.upsun.com/add-services/postgresql.html), [Redis](https://docs.upsun.com/add-services/redis.html), and [Elasticsearch](https://docs.upsun.com/add-services/elasticsearch.html) continue to scale vertically through manual configuration. This separation makes sense because databases and caches typically require different scaling strategies than stateless application layers.

```mermaid theme={null}
graph LR
    subgraph Upsun_Environment["Upsun Environment"]
        Router[Router]

        subgraph Application_Layer["Application Layer"]
            PHP1["PHP App<br/>Instance 1<br/>CPU: 85%"]
            PHP2["PHP App<br/>Instance 2<br/>CPU: 82%"]
            PHP3["PHP App<br/>Instance 3<br/>CPU: 79%"]
        end
        
        Network[Internal Network]

        subgraph Service_Layer["Service Layer"]
            MySQL["MySQL Primary<br/>4 CPU / 6.7 GB"]
            ES["Elasticsearch<br/>2 CPU / 4 GB"]
            Network_Storage["Network Storage<br/>"]
        end

        Router --> PHP1
        Router --> PHP2
        Router --> PHP3

        PHP1 --> Network
        PHP2 --> Network
        PHP3 --> Network

        Network -.-> MySQL
        Network -.-> Network_Storage
        Network -.-> ES
    end

    style Application_Layer fill:#D0F302,stroke:#000,color:#000
    style Service_Layer fill:#fff,stroke:#000,color:#000
    style Router fill:#000,stroke:#000,color:#D0F302
    style PHP1 fill:#D0F302,stroke:#000,color:#000
    style PHP2 fill:#D0F302,stroke:#000,color:#000
    style PHP3 fill:#D0F302,stroke:#000,color:#000
    style Network fill:#000,stroke:#000,color:#fff
    style MySQL fill:#6046FF,stroke:#000,color:#fff
    style ES fill:#6046FF,stroke:#000,color:#fff
    style Network_Storage fill:#6046FF,stroke:#000,color:#fff
```

### Practical example: E-commerce traffic spike

Consider a [Magento](https://docs.upsun.com/get-started/stacks/magento.html) storefront running on Upsun. During normal business hours, two PHP application instances handle incoming requests comfortably, maintaining 40% average CPU usage.

A flash sale begins at noon. Traffic increases fivefold within minutes. Average CPU across your two instances climbs to 85% and stays there for 5 minutes. Autoscaling detects this sustained elevation above the 80% threshold and launches a third instance. The load distributes across three containers, bringing average CPU down to 60%.

As the sale winds down two hours later, traffic returns to baseline levels. Average CPU drops to 25%, then 18% over the evaluation period. Autoscaling waits for the cooldown window to expire, confirms CPU remains below 20% for another 5 minutes, then removes one instance. Your infrastructure returns to two instances, matching the original capacity.

Throughout this cycle, your MySQL database and Elasticsearch service continue running with their manually configured resources: 4 CPU with 6.7 GB RAM for MySQL, 2 CPU with 4 GB RAM for Elasticsearch. These services don't need horizontal scaling for this workload pattern.

## Configure autoscaling for your application

### Enable autoscaling through the Console

Access your project in the Upsun Console and select the environment where you want autoscaling:

<img src="https://mintcdn.com/upsun-c9761871/tziXiwEbbKjwbX3l/images/posts/how-it-works/autoscaling-deep-dive/autoscaling-config.gif?s=5133b631655afc3ba89d672ed329b1cb" alt="Autoscaling config" width="3024" height="1888" data-path="images/posts/how-it-works/autoscaling-deep-dive/autoscaling-config.gif" />

1. Click **Configure resources** in the project card
2. Locate the autoscaling column for your application
3. Select **Enable**
4. Configure your thresholds and guardrails:
   * **Scale-up threshold**: CPU percentage that triggers instance addition (default: 80%)
   * **Scale-down threshold**: CPU percentage that triggers instance removal (default: 20%)
   * **Evaluation period**: How long metrics must exceed thresholds (1-60 minutes, default: 5)
   * **Cooldown window**: Wait time between scaling actions (default: 5 minutes)
   * **Minimum instances**: Baseline capacity that's always available (default: 1)
   * **Maximum instances**: Upper limit to prevent runaway scaling (default: 8, region-dependent)

### Understand your guardrails

Minimum and maximum instance counts act as safety boundaries. Setting minimum instances to 2 ensures your application maintains redundancy even during low traffic periods. This prevents a single point of failure and gives you instant capacity if traffic arrives suddenly.

Maximum instances protect against unexpected scaling costs. If your application experiences abnormal behavior (perhaps a bug causing excessive CPU usage), the maximum cap prevents unlimited resource consumption.

### Available triggers

Currently, autoscaling responds to **average CPU utilization** as its primary trigger. This metric provides a reliable indicator of application load across most workload types. Future releases will add memory-based triggers for applications with different resource consumption patterns.

## Autoscaling for different roles

### For developers: Implementation patterns

When you enable autoscaling, your application architecture becomes critical. Store session data in Redis or another shared service rather than in memory or local filesystem—sessions won't transfer between instances, breaking user experience. Similarly, use object storage (S3-compatible services) or network storage for uploaded files, since mount points on one instance won't appear on others.

Design your application to be stateless. Each instance should handle requests identically without depending on previous requests processe

### For technical leads: Capacity planning

Autoscaling shifts capacity planning from prediction to configuration. Set your scale-up threshold based on acceptable response times. If 80% CPU correlates with sub-200ms responses, that threshold maintains performance during growth. Evaluation periods balance responsiveness against stability. Short periods (2-3 minutes) respond quickly but may scale unnecessarily for brief spikes, while longer periods (10-15 minutes) provide stability at the cost of slower response.

For applications with predictable traffic patterns, like daily peaks at specific hours, consider scheduling vertical resource adjustments to supplement autoscaling. Scale CPU and RAM on your baseline instances before known traffic increases, then let autoscaling handle horizontal expansion as needed.

### For business decision-makers: Cost and availability optimization

Traditional fixed-capacity infrastructure requires paying for peak capacity around the clock. A retail site needing 8 application instances during holiday shopping peaks runs those 8 instances all year, including slow January weeks when traffic drops 70%. Autoscaling aligns costs with revenue-generating activity. During low-traffic periods, infrastructure scales down to minimum instances, reducing spend. When traffic and sales increase, scaling adds capacity automatically.

Reliability improves through automatic response to load. Manual scaling requires someone to notice performance degradation, access infrastructure controls, and trigger scaling actions. By the time this happens, users may have already experienced slow responses or errors. Autoscaling responds within minutes of detecting elevated load, often before human intervention would begin.

## Monitor autoscaling behavior

### Metrics and dashboards

Upsun provides several visibility layers for autoscaling activity. The [Infrastructure Metrics dashboard](https://docs.upsun.com/increase-observability/metrics/http-metrics.html) displays current instance count alongside CPU, memory, and request metrics. Track how scaling responds to traffic patterns and identify opportunities to refine thresholds.

Application metrics through Blackfire integration show performance impact at the code level. Compare response times and throughput across different instance counts to verify scaling improves application behavior as expected.

### Alerts and notifications

The Console displays scaling events with specific icons:

* Bell icon: Threshold alerts (e.g., "CPU above 80% for 5 minutes")
* Resources icon: Scaling actions (e.g., "1 instance added to application")

Configure custom notifications by setting up activity scripts that respond to `environment.alert` events. Send [Slack messages](https://docs.upsun.com/integrations/activity/slack.html), emails, or [webhook notifications](https://docs.upsun.com/integrations/activity/webhooks.html) when scaling occurs. This provides operational awareness without requiring constant dashboard monitoring.

### CLI access

Use the Upsun CLI to review [scaling events](https://docs.upsun.com/integrations/activity/reference.html#type) programmatically:

```bash {filename="Terminal"} theme={null}
upsun activity:list --type environment.alert
upsun activity:list --type environment.resources.update
```

These commands show historical scaling actions, including timestamps, triggering conditions, and resulting instance counts.

## Cost implications and billing

Autoscaling projects bill for consumed resources. Each instance added through autoscaling incurs the same charges as a manually configured instance with equivalent CPU and RAM.

Calculate maximum potential costs by multiplying your single-instance resource allocation by your maximum instance count. An application configured for 2 CPU and 4 GB RAM with maximum instances of 8 could consume up to 16 CPU and 32 GB RAM during peak scaling.

Monitor actual usage patterns through the billing dashboard. Compare costs across time periods to identify opportunities for optimization. If your application consistently runs at maximum instances, either traffic has permanently increased (requiring higher baseline resources), or your thresholds need adjustment to prevent aggressive scaling.

## Best practices and optimization strategies

### Threshold tuning

Start with default thresholds (80% scale-up, 20% scale-down) and adjust based on observed behavior. Applications with consistent, predictable load benefit from tighter thresholds (75% up, 30% down) that maintain resources closer to actual needs. Applications with spiky, unpredictable traffic need wider thresholds to prevent constant scaling fluctuations.

Monitor the frequency of scaling events. Multiple scale-up and scale-down cycles within an hour suggest overly sensitive thresholds or too-short evaluation periods. Adjust one parameter at a time to isolate the effect of each change.

### Application design for horizontal scaling

External services (databases, caches, search indexes) should live outside your application containers. Upsun's service architecture supports this naturally. Your application containers connect to services through configuration, allowing instances to share data stores without architectural changes.

Avoid local state within application containers. Each instance should handle requests identically, without depending on previous requests processed by the same instance. Store session data in [Redis](https://docs.upsun.com/add-services/redis.md), [Valkey](https://docs.upsun.com/add-services/valkey.md), or your database. Never store sessions in local memory or filesystem. Redis and Valkey offer the best performance for session storage with their in-memory architecture, while database storage provides an alternative if you already have a database service configured. This ensures the load balancer can distribute traffic efficiently across all available instances without breaking user sessions.

For file storage and volumes, use [Network Storage](https://docs.upsun.com/add-services/network-storage.md) to ensure all application instances can access the same files. Standard mounts are local to each container. Files written to one instance won't appear on others. Network Storage provides a shared filesystem accessible across all instances, perfect for user uploads, generated assets, or any files that need to persist across your horizontally scaled application layer. Configure Network Storage as a service in your project, then mount it in your application configuration following the guidelines for [composable images](https://docs.upsun.com/create-apps/app-reference/composable-image.md#mounts) or [single-runtime images](https://docs.upsun.com/create-apps/app-reference/single-runtime-image.md#mounts).

### Evaluation periods and cooldown windows

Longer evaluation periods (10-15 minutes) work well for applications where traffic changes gradually. E-commerce sites often see traffic build over 30-60 minutes as promotions spread through email and social media. A 15-minute evaluation period prevents scaling for temporary spikes while responding appropriately to sustained growth.

API services handling burst traffic need shorter periods (3-5 minutes). These applications see rapid load changes that require quick response. Balance this against cooldown windows to prevent oscillation.

### Managing cron jobs

[Cron jobs](https://docs.upsun.com/create-apps/app-reference/single-runtime-image.html#crons) executing during scaling events continue on their original instance until completion. This prevents interrupted tasks but means CPU-intensive cron jobs may trigger scale-ups.

Schedule resource-intensive jobs during known low-traffic periods. Database maintenance, report generation, and data processing work better late at night or early morning when autoscaling runs at minimum capacity.

Alternatively, move long-running tasks to dedicated [worker](https://docs.upsun.com/create-apps/app-reference/single-runtime-image.html#workers) containers that scale independently. Separate [cron job](https://docs.upsun.com/create-apps/app-reference/single-runtime-image.html#crons) execution from request handling, giving you fine-grained control over resources for each workload type.

## Advanced scenario: Multi-app autoscaling

Upsun's [multi-app architecture](https://docs.upsun.com/create-apps.html#use-multiple-apps) allows different applications within a single project to scale independently. Consider a headless commerce implementation:

* **API application** (Node.js): Handles product data, cart operations, checkout
* **Frontend application** (Next.js): Delivers server-rendered pages to users
* **Admin application** (PHP): Provides merchant dashboard for order management

Enable autoscaling on each application with different thresholds:

* API: 70% scale-up (CPU-intensive data processing), minimum 2 instances
* Frontend: 80% scale-up (lighter workload), minimum 2 instances
* Admin: Manual scaling only (predictable load from internal users)

During a marketing campaign, the frontend and API scale independently based on their respective loads. The admin application maintains fixed capacity since merchant activity doesn't correlate with customer traffic.

## Limitations and current support

Autoscaling currently supports:

* Application containers (PHP, Node.js, Python, Go, Java, Ruby, .NET)
* CPU-based triggers
* Upsun Flex product tier
* All environment types (development, staging, production)

Autoscaling does not support:

* Services (databases, caches, search indexes)
* Worker containers and background job queues
* Memory-based triggers (planned for future release)
* Scaling to zero instances

## Related resources

**Configuration and management**:

* [Resource configuration](https://docs.upsun.com/manage-resources/adjust-resources.html)
* [Resource initialization strategies](https://docs.upsun.com/manage-resources/resource-init.html)
* [Manual horizontal scaling](https://docs.upsun.com/manage-resources/adjust-resources.html#horizontal-scaling)

**Monitoring and observability**:

* [Infrastructure metrics](https://docs.upsun.com/increase-observability/metrics.html)
* [Application performance monitoring](https://docs.upsun.com/increase-observability/application-metrics.html)
* [Blackfire integration](https://docs.upsun.com/increase-observability/application-metrics/blackfire.html)

**Cost management**:

* [Monitor billing](https://docs.upsun.com/administration/billing/bp-monitor-billing.html)
* [Upsun pricing](https://www.upsun.com/pricing/)

***

**Get started with autoscaling**:

Create a free Upsun account at [upsun.com](https://upsun.com) and enable autoscaling on your first project. Configure thresholds based on your application's performance characteristics, then monitor scaling behavior through the Console metrics dashboard. Adjust settings as you learn your application's patterns, finding the balance between performance, stability, and cost that works for your specific workload.