virt/kvm/arm/vgic.c

   1 /*
   2  * Copyright (C) 2012 ARM Ltd.
   3  * Author: Marc Zyngier <marc.zyngier@arm.com>
   4  *
   5  * This program is free software; you can redistribute it and/or modify
   6  * it under the terms of the GNU General Public License version 2 as
   7  * published by the Free Software Foundation.
   8  *
   9  * This program is distributed in the hope that it will be useful,
  10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  12  * GNU General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU General Public License
  15  * along with this program; if not, write to the Free Software
  16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  17  */
  18
  19 #include <linux/cpu.h>
  20 #include <linux/kvm.h>
  21 #include <linux/kvm_host.h>
  22 #include <linux/interrupt.h>
  23 #include <linux/io.h>
  24 #include <linux/of.h>
  25 #include <linux/of_address.h>
  26 #include <linux/of_irq.h>
  27 #include <linux/rculist.h>
  28 #include <linux/uaccess.h>
  29
  30 #include <asm/kvm_emulate.h>
  31 #include <asm/kvm_arm.h>
  32 #include <asm/kvm_mmu.h>
  33 #include <trace/events/kvm.h>
  34 #include <asm/kvm.h>
  35 #include <kvm/iodev.h>
  36
  37 /*
  38  * How the whole thing works (courtesy of Christoffer Dall):
  39  *
  40  * - At any time, the dist->irq_pending_on_cpu is the oracle that knows if
  41  *   something is pending on the CPU interface.
  42  * - Interrupts that are pending on the distributor are stored on the
  43  *   vgic.irq_pending vgic bitmap (this bitmap is updated by both user land
  44  *   ioctls and guest mmio ops, and other in-kernel peripherals such as the
  45  *   arch. timers).
  46  * - Every time the bitmap changes, the irq_pending_on_cpu oracle is
  47  *   recalculated
  48  * - To calculate the oracle, we need info for each cpu from
  49  *   compute_pending_for_cpu, which considers:
  50  *   - PPI: dist->irq_pending & dist->irq_enable
  51  *   - SPI: dist->irq_pending & dist->irq_enable & dist->irq_spi_target
  52  *   - irq_spi_target is a 'formatted' version of the GICD_ITARGETSRn
  53  *     registers, stored on each vcpu. We only keep one bit of
  54  *     information per interrupt, making sure that only one vcpu can
  55  *     accept the interrupt.
  56  * - If any of the above state changes, we must recalculate the oracle.
  57  * - The same is true when injecting an interrupt, except that we only
  58  *   consider a single interrupt at a time. The irq_spi_cpu array
  59  *   contains the target CPU for each SPI.
  60  *
  61  * The handling of level interrupts adds some extra complexity. We
  62  * need to track when the interrupt has been EOIed, so we can sample
  63  * the 'line' again. This is achieved as such:
  64  *
  65  * - When a level interrupt is moved onto a vcpu, the corresponding
  66  *   bit in irq_queued is set. As long as this bit is set, the line
  67  *   will be ignored for further interrupts. The interrupt is injected
  68  *   into the vcpu with the GICH_LR_EOI bit set (generate a
  69  *   maintenance interrupt on EOI).
  70  * - When the interrupt is EOIed, the maintenance interrupt fires,
  71  *   and clears the corresponding bit in irq_queued. This allows the
  72  *   interrupt line to be sampled again.
  73  * - Note that level-triggered interrupts can also be set to pending from
  74  *   writes to GICD_ISPENDRn and lowering the external input line does not
  75  *   cause the interrupt to become inactive in such a situation.
  76  *   Conversely, writes to GICD_ICPENDRn do not cause the interrupt to become
  77  *   inactive as long as the external input line is held high.
  78  *
  79  *
  80  * Initialization rules: there are multiple stages to the vgic
  81  * initialization, both for the distributor and the CPU interfaces.
  82  *
  83  * Distributor:
  84  *
  85  * - kvm_vgic_early_init(): initialization of static data that doesn't
  86  *   depend on any sizing information or emulation type. No allocation
  87  *   is allowed there.
  88  *
  89  * - vgic_init(): allocation and initialization of the generic data
  90  *   structures that depend on sizing information (number of CPUs,
  91  *   number of interrupts). Also initializes the vcpu specific data
  92  *   structures. Can be executed lazily for GICv2.
  93  *   [to be renamed to kvm_vgic_init??]
  94  *
  95  * CPU Interface:
  96  *
  97  * - kvm_vgic_cpu_early_init(): initialization of static data that
  98  *   doesn't depend on any sizing information or emulation type. No
  99  *   allocation is allowed there.
 100  */
 101
 102 #include "vgic.h"
 103
 104 static void vgic_retire_disabled_irqs(struct kvm_vcpu *vcpu);
 105 static void vgic_retire_lr(int lr_nr, int irq, struct kvm_vcpu *vcpu);
 106 static struct vgic_lr vgic_get_lr(const struct kvm_vcpu *vcpu, int lr);
 107 static void vgic_set_lr(struct kvm_vcpu *vcpu, int lr, struct vgic_lr lr_desc);
 108 static struct irq_phys_map *vgic_irq_map_search(struct kvm_vcpu *vcpu,
 109                                                 int virt_irq);
 110 static int compute_pending_for_cpu(struct kvm_vcpu *vcpu);
 111
 112 static const struct vgic_ops *vgic_ops;
 113 static const struct vgic_params *vgic;
 114
 115 static void add_sgi_source(struct kvm_vcpu *vcpu, int irq, int source)
 116 {
 117         vcpu->kvm->arch.vgic.vm_ops.add_sgi_source(vcpu, irq, source);
 118 }
 119
 120 static bool queue_sgi(struct kvm_vcpu *vcpu, int irq)
 121 {
 122         return vcpu->kvm->arch.vgic.vm_ops.queue_sgi(vcpu, irq);
 123 }
 124
 125 int kvm_vgic_map_resources(struct kvm *kvm)
 126 {
 127         return kvm->arch.vgic.vm_ops.map_resources(kvm, vgic);
 128 }
 129
 130 /*
 131  * struct vgic_bitmap contains a bitmap made of unsigned longs, but
 132  * extracts u32s out of them.
 133  *
 134  * This does not work on 64-bit BE systems, because the bitmap access
 135  * will store two consecutive 32-bit words with the higher-addressed
 136  * register's bits at the lower index and the lower-addressed register's
 137  * bits at the higher index.
 138  *
 139  * Therefore, swizzle the register index when accessing the 32-bit word
 140  * registers to access the right register's value.
 141  */
 142 #if defined(CONFIG_CPU_BIG_ENDIAN) && BITS_PER_LONG == 64
 143 #define REG_OFFSET_SWIZZLE      1
 144 #else
 145 #define REG_OFFSET_SWIZZLE      0
 146 #endif
 147
 148 static int vgic_init_bitmap(struct vgic_bitmap *b, int nr_cpus, int nr_irqs)
 149 {
 150         int nr_longs;
 151
 152         nr_longs = nr_cpus + BITS_TO_LONGS(nr_irqs - VGIC_NR_PRIVATE_IRQS);
 153
 154         b->private = kzalloc(sizeof(unsigned long) * nr_longs, GFP_KERNEL);
 155         if (!b->private)
 156                 return -ENOMEM;
 157
 158         b->shared = b->private + nr_cpus;
 159
 160         return 0;
 161 }
 162
 163 static void vgic_free_bitmap(struct vgic_bitmap *b)
 164 {
 165         kfree(b->private);
 166         b->private = NULL;
 167         b->shared = NULL;
 168 }
 169
 170 /*
 171  * Call this function to convert a u64 value to an unsigned long * bitmask
 172  * in a way that works on both 32-bit and 64-bit LE and BE platforms.
 173  *
 174  * Warning: Calling this function may modify *val.
 175  */
 176 static unsigned long *u64_to_bitmask(u64 *val)
 177 {
 178 #if defined(CONFIG_CPU_BIG_ENDIAN) && BITS_PER_LONG == 32
 179         *val = (*val >> 32) | (*val << 32);
 180 #endif
 181         return (unsigned long *)val;
 182 }
 183
 184 u32 *vgic_bitmap_get_reg(struct vgic_bitmap *x, int cpuid, u32 offset)
 185 {
 186         offset >>= 2;
 187         if (!offset)
 188                 return (u32 *)(x->private + cpuid) + REG_OFFSET_SWIZZLE;
 189         else
 190                 return (u32 *)(x->shared) + ((offset - 1) ^ REG_OFFSET_SWIZZLE);
 191 }
 192
 193 static int vgic_bitmap_get_irq_val(struct vgic_bitmap *x,
 194                                    int cpuid, int irq)
 195 {
 196         if (irq < VGIC_NR_PRIVATE_IRQS)
 197                 return test_bit(irq, x->private + cpuid);
 198
 199         return test_bit(irq - VGIC_NR_PRIVATE_IRQS, x->shared);
 200 }
 201
 202 void vgic_bitmap_set_irq_val(struct vgic_bitmap *x, int cpuid,
 203                              int irq, int val)
 204 {
 205         unsigned long *reg;
 206
 207         if (irq < VGIC_NR_PRIVATE_IRQS) {
 208                 reg = x->private + cpuid;
 209         } else {
 210                 reg = x->shared;
 211                 irq -= VGIC_NR_PRIVATE_IRQS;
 212         }
 213
 214         if (val)
 215                 set_bit(irq, reg);
 216         else
 217                 clear_bit(irq, reg);
 218 }
 219
 220 static unsigned long *vgic_bitmap_get_cpu_map(struct vgic_bitmap *x, int cpuid)
 221 {
 222         return x->private + cpuid;
 223 }
 224
 225 unsigned long *vgic_bitmap_get_shared_map(struct vgic_bitmap *x)
 226 {
 227         return x->shared;
 228 }
 229
 230 static int vgic_init_bytemap(struct vgic_bytemap *x, int nr_cpus, int nr_irqs)
 231 {
 232         int size;
 233
 234         size  = nr_cpus * VGIC_NR_PRIVATE_IRQS;
 235         size += nr_irqs - VGIC_NR_PRIVATE_IRQS;
 236
 237         x->private = kzalloc(size, GFP_KERNEL);
 238         if (!x->private)
 239                 return -ENOMEM;
 240
 241         x->shared = x->private + nr_cpus * VGIC_NR_PRIVATE_IRQS / sizeof(u32);
 242         return 0;
 243 }
 244
 245 static void vgic_free_bytemap(struct vgic_bytemap *b)
 246 {
 247         kfree(b->private);
 248         b->private = NULL;
 249         b->shared = NULL;
 250 }
 251
 252 u32 *vgic_bytemap_get_reg(struct vgic_bytemap *x, int cpuid, u32 offset)
 253 {
 254         u32 *reg;
 255
 256         if (offset < VGIC_NR_PRIVATE_IRQS) {
 257                 reg = x->private;
 258                 offset += cpuid * VGIC_NR_PRIVATE_IRQS;
 259         } else {
 260                 reg = x->shared;
 261                 offset -= VGIC_NR_PRIVATE_IRQS;
 262         }
 263
 264         return reg + (offset / sizeof(u32));
 265 }
 266
 267 #define VGIC_CFG_LEVEL  0
 268 #define VGIC_CFG_EDGE   1
 269
 270 static bool vgic_irq_is_edge(struct kvm_vcpu *vcpu, int irq)
 271 {
 272         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 273         int irq_val;
 274
 275         irq_val = vgic_bitmap_get_irq_val(&dist->irq_cfg, vcpu->vcpu_id, irq);
 276         return irq_val == VGIC_CFG_EDGE;
 277 }
 278
 279 static int vgic_irq_is_enabled(struct kvm_vcpu *vcpu, int irq)
 280 {
 281         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 282
 283         return vgic_bitmap_get_irq_val(&dist->irq_enabled, vcpu->vcpu_id, irq);
 284 }
 285
 286 static int vgic_irq_is_queued(struct kvm_vcpu *vcpu, int irq)
 287 {
 288         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 289
 290         return vgic_bitmap_get_irq_val(&dist->irq_queued, vcpu->vcpu_id, irq);
 291 }
 292
 293 static int vgic_irq_is_active(struct kvm_vcpu *vcpu, int irq)
 294 {
 295         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 296
 297         return vgic_bitmap_get_irq_val(&dist->irq_active, vcpu->vcpu_id, irq);
 298 }
 299
 300 static void vgic_irq_set_queued(struct kvm_vcpu *vcpu, int irq)
 301 {
 302         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 303
 304         vgic_bitmap_set_irq_val(&dist->irq_queued, vcpu->vcpu_id, irq, 1);
 305 }
 306
 307 static void vgic_irq_clear_queued(struct kvm_vcpu *vcpu, int irq)
 308 {
 309         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 310
 311         vgic_bitmap_set_irq_val(&dist->irq_queued, vcpu->vcpu_id, irq, 0);
 312 }
 313
 314 static void vgic_irq_set_active(struct kvm_vcpu *vcpu, int irq)
 315 {
 316         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 317
 318         vgic_bitmap_set_irq_val(&dist->irq_active, vcpu->vcpu_id, irq, 1);
 319 }
 320
 321 static void vgic_irq_clear_active(struct kvm_vcpu *vcpu, int irq)
 322 {
 323         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 324
 325         vgic_bitmap_set_irq_val(&dist->irq_active, vcpu->vcpu_id, irq, 0);
 326 }
 327
 328 static int vgic_dist_irq_get_level(struct kvm_vcpu *vcpu, int irq)
 329 {
 330         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 331
 332         return vgic_bitmap_get_irq_val(&dist->irq_level, vcpu->vcpu_id, irq);
 333 }
 334
 335 static void vgic_dist_irq_set_level(struct kvm_vcpu *vcpu, int irq)
 336 {
 337         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 338
 339         vgic_bitmap_set_irq_val(&dist->irq_level, vcpu->vcpu_id, irq, 1);
 340 }
 341
 342 static void vgic_dist_irq_clear_level(struct kvm_vcpu *vcpu, int irq)
 343 {
 344         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 345
 346         vgic_bitmap_set_irq_val(&dist->irq_level, vcpu->vcpu_id, irq, 0);
 347 }
 348
 349 static int vgic_dist_irq_soft_pend(struct kvm_vcpu *vcpu, int irq)
 350 {
 351         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 352
 353         return vgic_bitmap_get_irq_val(&dist->irq_soft_pend, vcpu->vcpu_id, irq);
 354 }
 355
 356 static void vgic_dist_irq_clear_soft_pend(struct kvm_vcpu *vcpu, int irq)
 357 {
 358         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 359
 360         vgic_bitmap_set_irq_val(&dist->irq_soft_pend, vcpu->vcpu_id, irq, 0);
 361         if (!vgic_dist_irq_get_level(vcpu, irq)) {
 362                 vgic_dist_irq_clear_pending(vcpu, irq);
 363                 if (!compute_pending_for_cpu(vcpu))
 364                         clear_bit(vcpu->vcpu_id, dist->irq_pending_on_cpu);
 365         }
 366 }
 367
 368 static int vgic_dist_irq_is_pending(struct kvm_vcpu *vcpu, int irq)
 369 {
 370         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 371
 372         return vgic_bitmap_get_irq_val(&dist->irq_pending, vcpu->vcpu_id, irq);
 373 }
 374
 375 void vgic_dist_irq_set_pending(struct kvm_vcpu *vcpu, int irq)
 376 {
 377         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 378
 379         vgic_bitmap_set_irq_val(&dist->irq_pending, vcpu->vcpu_id, irq, 1);
 380 }
 381
 382 void vgic_dist_irq_clear_pending(struct kvm_vcpu *vcpu, int irq)
 383 {
 384         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 385
 386         vgic_bitmap_set_irq_val(&dist->irq_pending, vcpu->vcpu_id, irq, 0);
 387 }
 388
 389 static void vgic_cpu_irq_set(struct kvm_vcpu *vcpu, int irq)
 390 {
 391         if (irq < VGIC_NR_PRIVATE_IRQS)
 392                 set_bit(irq, vcpu->arch.vgic_cpu.pending_percpu);
 393         else
 394                 set_bit(irq - VGIC_NR_PRIVATE_IRQS,
 395                         vcpu->arch.vgic_cpu.pending_shared);
 396 }
 397
 398 void vgic_cpu_irq_clear(struct kvm_vcpu *vcpu, int irq)
 399 {
 400         if (irq < VGIC_NR_PRIVATE_IRQS)
 401                 clear_bit(irq, vcpu->arch.vgic_cpu.pending_percpu);
 402         else
 403                 clear_bit(irq - VGIC_NR_PRIVATE_IRQS,
 404                           vcpu->arch.vgic_cpu.pending_shared);
 405 }
 406
 407 static bool vgic_can_sample_irq(struct kvm_vcpu *vcpu, int irq)
 408 {
 409         return !vgic_irq_is_queued(vcpu, irq);
 410 }
 411
 412 /**
 413  * vgic_reg_access - access vgic register
 414  * @mmio:   pointer to the data describing the mmio access
 415  * @reg:    pointer to the virtual backing of vgic distributor data
 416  * @offset: least significant 2 bits used for word offset
 417  * @mode:   ACCESS_ mode (see defines above)
 418  *
 419  * Helper to make vgic register access easier using one of the access
 420  * modes defined for vgic register access
 421  * (read,raz,write-ignored,setbit,clearbit,write)
 422  */
 423 void vgic_reg_access(struct kvm_exit_mmio *mmio, u32 *reg,
 424                      phys_addr_t offset, int mode)
 425 {
 426         int word_offset = (offset & 3) * 8;
 427         u32 mask = (1UL << (mmio->len * 8)) - 1;
 428         u32 regval;
 429
 430         /*
 431          * Any alignment fault should have been delivered to the guest
 432          * directly (ARM ARM B3.12.7 "Prioritization of aborts").
 433          */
 434
 435         if (reg) {
 436                 regval = *reg;
 437         } else {
 438                 BUG_ON(mode != (ACCESS_READ_RAZ | ACCESS_WRITE_IGNORED));
 439                 regval = 0;
 440         }
 441
 442         if (mmio->is_write) {
 443                 u32 data = mmio_data_read(mmio, mask) << word_offset;
 444                 switch (ACCESS_WRITE_MASK(mode)) {
 445                 case ACCESS_WRITE_IGNORED:
 446                         return;
 447
 448                 case ACCESS_WRITE_SETBIT:
 449                         regval |= data;
 450                         break;
 451
 452                 case ACCESS_WRITE_CLEARBIT:
 453                         regval &= ~data;
 454                         break;
 455
 456                 case ACCESS_WRITE_VALUE:
 457                         regval = (regval & ~(mask << word_offset)) | data;
 458                         break;
 459                 }
 460                 *reg = regval;
 461         } else {
 462                 switch (ACCESS_READ_MASK(mode)) {
 463                 case ACCESS_READ_RAZ:
 464                         regval = 0;
 465                         /* fall through */
 466
 467                 case ACCESS_READ_VALUE:
 468                         mmio_data_write(mmio, mask, regval >> word_offset);
 469                 }
 470         }
 471 }
 472
 473 bool handle_mmio_raz_wi(struct kvm_vcpu *vcpu, struct kvm_exit_mmio *mmio,
 474                         phys_addr_t offset)
 475 {
 476         vgic_reg_access(mmio, NULL, offset,
 477                         ACCESS_READ_RAZ | ACCESS_WRITE_IGNORED);
 478         return false;
 479 }
 480
 481 bool vgic_handle_enable_reg(struct kvm *kvm, struct kvm_exit_mmio *mmio,
 482                             phys_addr_t offset, int vcpu_id, int access)
 483 {
 484         u32 *reg;
 485         int mode = ACCESS_READ_VALUE | access;
 486         struct kvm_vcpu *target_vcpu = kvm_get_vcpu(kvm, vcpu_id);
 487
 488         reg = vgic_bitmap_get_reg(&kvm->arch.vgic.irq_enabled, vcpu_id, offset);
 489         vgic_reg_access(mmio, reg, offset, mode);
 490         if (mmio->is_write) {
 491                 if (access & ACCESS_WRITE_CLEARBIT) {
 492                         if (offset < 4) /* Force SGI enabled */
 493                                 *reg |= 0xffff;
 494                         vgic_retire_disabled_irqs(target_vcpu);
 495                 }
 496                 vgic_update_state(kvm);
 497                 return true;
 498         }
 499
 500         return false;
 501 }
 502
 503 bool vgic_handle_set_pending_reg(struct kvm *kvm,
 504                                  struct kvm_exit_mmio *mmio,
 505                                  phys_addr_t offset, int vcpu_id)
 506 {
 507         u32 *reg, orig;
 508         u32 level_mask;
 509         int mode = ACCESS_READ_VALUE | ACCESS_WRITE_SETBIT;
 510         struct vgic_dist *dist = &kvm->arch.vgic;
 511
 512         reg = vgic_bitmap_get_reg(&dist->irq_cfg, vcpu_id, offset);
 513         level_mask = (~(*reg));
 514
 515         /* Mark both level and edge triggered irqs as pending */
 516         reg = vgic_bitmap_get_reg(&dist->irq_pending, vcpu_id, offset);
 517         orig = *reg;
 518         vgic_reg_access(mmio, reg, offset, mode);
 519
 520         if (mmio->is_write) {
 521                 /* Set the soft-pending flag only for level-triggered irqs */
 522                 reg = vgic_bitmap_get_reg(&dist->irq_soft_pend,
 523                                           vcpu_id, offset);
 524                 vgic_reg_access(mmio, reg, offset, mode);
 525                 *reg &= level_mask;
 526
 527                 /* Ignore writes to SGIs */
 528                 if (offset < 2) {
 529                         *reg &= ~0xffff;
 530                         *reg |= orig & 0xffff;
 531                 }
 532
 533                 vgic_update_state(kvm);
 534                 return true;
 535         }
 536
 537         return false;
 538 }
 539
 540 /*
 541  * If a mapped interrupt's state has been modified by the guest such that it
 542  * is no longer active or pending, without it have gone through the sync path,
 543  * then the map->active field must be cleared so the interrupt can be taken
 544  * again.
 545  */
 546 static void vgic_handle_clear_mapped_irq(struct kvm_vcpu *vcpu)
 547 {
 548         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
 549         struct list_head *root;
 550         struct irq_phys_map_entry *entry;
 551         struct irq_phys_map *map;
 552
 553         rcu_read_lock();
 554
 555         /* Check for PPIs */
 556         root = &vgic_cpu->irq_phys_map_list;
 557         list_for_each_entry_rcu(entry, root, entry) {
 558                 map = &entry->map;
 559
 560                 if (!vgic_dist_irq_is_pending(vcpu, map->virt_irq) &&
 561                     !vgic_irq_is_active(vcpu, map->virt_irq))
 562                         map->active = false;
 563         }
 564
 565         rcu_read_unlock();
 566 }
 567
 568 bool vgic_handle_clear_pending_reg(struct kvm *kvm,
 569                                    struct kvm_exit_mmio *mmio,
 570                                    phys_addr_t offset, int vcpu_id)
 571 {
 572         u32 *level_active;
 573         u32 *reg, orig;
 574         int mode = ACCESS_READ_VALUE | ACCESS_WRITE_CLEARBIT;
 575         struct vgic_dist *dist = &kvm->arch.vgic;
 576
 577         reg = vgic_bitmap_get_reg(&dist->irq_pending, vcpu_id, offset);
 578         orig = *reg;
 579         vgic_reg_access(mmio, reg, offset, mode);
 580         if (mmio->is_write) {
 581                 /* Re-set level triggered level-active interrupts */
 582                 level_active = vgic_bitmap_get_reg(&dist->irq_level,
 583                                           vcpu_id, offset);
 584                 reg = vgic_bitmap_get_reg(&dist->irq_pending, vcpu_id, offset);
 585                 *reg |= *level_active;
 586
 587                 /* Ignore writes to SGIs */
 588                 if (offset < 2) {
 589                         *reg &= ~0xffff;
 590                         *reg |= orig & 0xffff;
 591                 }
 592
 593                 /* Clear soft-pending flags */
 594                 reg = vgic_bitmap_get_reg(&dist->irq_soft_pend,
 595                                           vcpu_id, offset);
 596                 vgic_reg_access(mmio, reg, offset, mode);
 597
 598                 vgic_handle_clear_mapped_irq(kvm_get_vcpu(kvm, vcpu_id));
 599                 vgic_update_state(kvm);
 600                 return true;
 601         }
 602         return false;
 603 }
 604
 605 bool vgic_handle_set_active_reg(struct kvm *kvm,
 606                                 struct kvm_exit_mmio *mmio,
 607                                 phys_addr_t offset, int vcpu_id)
 608 {
 609         u32 *reg;
 610         struct vgic_dist *dist = &kvm->arch.vgic;
 611
 612         reg = vgic_bitmap_get_reg(&dist->irq_active, vcpu_id, offset);
 613         vgic_reg_access(mmio, reg, offset,
 614                         ACCESS_READ_VALUE | ACCESS_WRITE_SETBIT);
 615
 616         if (mmio->is_write) {
 617                 vgic_update_state(kvm);
 618                 return true;
 619         }
 620
 621         return false;
 622 }
 623
 624 bool vgic_handle_clear_active_reg(struct kvm *kvm,
 625                                   struct kvm_exit_mmio *mmio,
 626                                   phys_addr_t offset, int vcpu_id)
 627 {
 628         u32 *reg;
 629         struct vgic_dist *dist = &kvm->arch.vgic;
 630
 631         reg = vgic_bitmap_get_reg(&dist->irq_active, vcpu_id, offset);
 632         vgic_reg_access(mmio, reg, offset,
 633                         ACCESS_READ_VALUE | ACCESS_WRITE_CLEARBIT);
 634
 635         if (mmio->is_write) {
 636                 vgic_handle_clear_mapped_irq(kvm_get_vcpu(kvm, vcpu_id));
 637                 vgic_update_state(kvm);
 638                 return true;
 639         }
 640
 641         return false;
 642 }
 643
 644 static u32 vgic_cfg_expand(u16 val)
 645 {
 646         u32 res = 0;
 647         int i;
 648
 649         /*
 650          * Turn a 16bit value like abcd...mnop into a 32bit word
 651          * a0b0c0d0...m0n0o0p0, which is what the HW cfg register is.
 652          */
 653         for (i = 0; i < 16; i++)
 654                 res |= ((val >> i) & VGIC_CFG_EDGE) << (2 * i + 1);
 655
 656         return res;
 657 }
 658
 659 static u16 vgic_cfg_compress(u32 val)
 660 {
 661         u16 res = 0;
 662         int i;
 663
 664         /*
 665          * Turn a 32bit word a0b0c0d0...m0n0o0p0 into 16bit value like
 666          * abcd...mnop which is what we really care about.
 667          */
 668         for (i = 0; i < 16; i++)
 669                 res |= ((val >> (i * 2 + 1)) & VGIC_CFG_EDGE) << i;
 670
 671         return res;
 672 }
 673
 674 /*
 675  * The distributor uses 2 bits per IRQ for the CFG register, but the
 676  * LSB is always 0. As such, we only keep the upper bit, and use the
 677  * two above functions to compress/expand the bits
 678  */
 679 bool vgic_handle_cfg_reg(u32 *reg, struct kvm_exit_mmio *mmio,
 680                          phys_addr_t offset)
 681 {
 682         u32 val;
 683
 684         if (offset & 4)
 685                 val = *reg >> 16;
 686         else
 687                 val = *reg & 0xffff;
 688
 689         val = vgic_cfg_expand(val);
 690         vgic_reg_access(mmio, &val, offset,
 691                         ACCESS_READ_VALUE | ACCESS_WRITE_VALUE);
 692         if (mmio->is_write) {
 693                 if (offset < 8) {
 694                         *reg = ~0U; /* Force PPIs/SGIs to 1 */
 695                         return false;
 696                 }
 697
 698                 val = vgic_cfg_compress(val);
 699                 if (offset & 4) {
 700                         *reg &= 0xffff;
 701                         *reg |= val << 16;
 702                 } else {
 703                         *reg &= 0xffff << 16;
 704                         *reg |= val;
 705                 }
 706         }
 707
 708         return false;
 709 }
 710
 711 /**
 712  * vgic_unqueue_irqs - move pending/active IRQs from LRs to the distributor
 713  * @vgic_cpu: Pointer to the vgic_cpu struct holding the LRs
 714  *
 715  * Move any IRQs that have already been assigned to LRs back to the
 716  * emulated distributor state so that the complete emulated state can be read
 717  * from the main emulation structures without investigating the LRs.
 718  */
 719 void vgic_unqueue_irqs(struct kvm_vcpu *vcpu)
 720 {
 721         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
 722         int i;
 723
 724         for_each_set_bit(i, vgic_cpu->lr_used, vgic_cpu->nr_lr) {
 725                 struct vgic_lr lr = vgic_get_lr(vcpu, i);
 726
 727                 /*
 728                  * There are three options for the state bits:
 729                  *
 730                  * 01: pending
 731                  * 10: active
 732                  * 11: pending and active
 733                  */
 734                 BUG_ON(!(lr.state & LR_STATE_MASK));
 735
 736                 /* Reestablish SGI source for pending and active IRQs */
 737                 if (lr.irq < VGIC_NR_SGIS)
 738                         add_sgi_source(vcpu, lr.irq, lr.source);
 739
 740                 /*
 741                  * If the LR holds an active (10) or a pending and active (11)
 742                  * interrupt then move the active state to the
 743                  * distributor tracking bit.
 744                  */
 745                 if (lr.state & LR_STATE_ACTIVE) {
 746                         vgic_irq_set_active(vcpu, lr.irq);
 747                         lr.state &= ~LR_STATE_ACTIVE;
 748                 }
 749
 750                 /*
 751                  * Reestablish the pending state on the distributor and the
 752                  * CPU interface.  It may have already been pending, but that
 753                  * is fine, then we are only setting a few bits that were
 754                  * already set.
 755                  */
 756                 if (lr.state & LR_STATE_PENDING) {
 757                         vgic_dist_irq_set_pending(vcpu, lr.irq);
 758                         lr.state &= ~LR_STATE_PENDING;
 759                 }
 760
 761                 vgic_set_lr(vcpu, i, lr);
 762
 763                 /*
 764                  * Mark the LR as free for other use.
 765                  */
 766                 BUG_ON(lr.state & LR_STATE_MASK);
 767                 vgic_retire_lr(i, lr.irq, vcpu);
 768                 vgic_irq_clear_queued(vcpu, lr.irq);
 769
 770                 /* Finally update the VGIC state. */
 771                 vgic_update_state(vcpu->kvm);
 772         }
 773 }
 774
 775 const
 776 struct vgic_io_range *vgic_find_range(const struct vgic_io_range *ranges,
 777                                       int len, gpa_t offset)
 778 {
 779         while (ranges->len) {
 780                 if (offset >= ranges->base &&
 781                     (offset + len) <= (ranges->base + ranges->len))
 782                         return ranges;
 783                 ranges++;
 784         }
 785
 786         return NULL;
 787 }
 788
 789 static bool vgic_validate_access(const struct vgic_dist *dist,
 790                                  const struct vgic_io_range *range,
 791                                  unsigned long offset)
 792 {
 793         int irq;
 794
 795         if (!range->bits_per_irq)
 796                 return true;    /* Not an irq-based access */
 797
 798         irq = offset * 8 / range->bits_per_irq;
 799         if (irq >= dist->nr_irqs)
 800                 return false;
 801
 802         return true;
 803 }
 804
 805 /*
 806  * Call the respective handler function for the given range.
 807  * We split up any 64 bit accesses into two consecutive 32 bit
 808  * handler calls and merge the result afterwards.
 809  * We do this in a little endian fashion regardless of the host's
 810  * or guest's endianness, because the GIC is always LE and the rest of
 811  * the code (vgic_reg_access) also puts it in a LE fashion already.
 812  * At this point we have already identified the handle function, so
 813  * range points to that one entry and offset is relative to this.
 814  */
 815 static bool call_range_handler(struct kvm_vcpu *vcpu,
 816                                struct kvm_exit_mmio *mmio,
 817                                unsigned long offset,
 818                                const struct vgic_io_range *range)
 819 {
 820         struct kvm_exit_mmio mmio32;
 821         bool ret;
 822
 823         if (likely(mmio->len <= 4))
 824                 return range->handle_mmio(vcpu, mmio, offset);
 825
 826         /*
 827          * Any access bigger than 4 bytes (that we currently handle in KVM)
 828          * is actually 8 bytes long, caused by a 64-bit access
 829          */
 830
 831         mmio32.len = 4;
 832         mmio32.is_write = mmio->is_write;
 833         mmio32.private = mmio->private;
 834
 835         mmio32.phys_addr = mmio->phys_addr + 4;
 836         mmio32.data = &((u32 *)mmio->data)[1];
 837         ret = range->handle_mmio(vcpu, &mmio32, offset + 4);
 838
 839         mmio32.phys_addr = mmio->phys_addr;
 840         mmio32.data = &((u32 *)mmio->data)[0];
 841         ret |= range->handle_mmio(vcpu, &mmio32, offset);
 842
 843         return ret;
 844 }
 845
 846 /**
 847  * vgic_handle_mmio_access - handle an in-kernel MMIO access
 848  * This is called by the read/write KVM IO device wrappers below.
 849  * @vcpu:       pointer to the vcpu performing the access
 850  * @this:       pointer to the KVM IO device in charge
 851  * @addr:       guest physical address of the access
 852  * @len:        size of the access
 853  * @val:        pointer to the data region
 854  * @is_write:   read or write access
 855  *
 856  * returns true if the MMIO access could be performed
 857  */
 858 static int vgic_handle_mmio_access(struct kvm_vcpu *vcpu,
 859                                    struct kvm_io_device *this, gpa_t addr,
 860                                    int len, void *val, bool is_write)
 861 {
 862         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 863         struct vgic_io_device *iodev = container_of(this,
 864                                                     struct vgic_io_device, dev);
 865         struct kvm_run *run = vcpu->run;
 866         const struct vgic_io_range *range;
 867         struct kvm_exit_mmio mmio;
 868         bool updated_state;
 869         gpa_t offset;
 870
 871         offset = addr - iodev->addr;
 872         range = vgic_find_range(iodev->reg_ranges, len, offset);
 873         if (unlikely(!range || !range->handle_mmio)) {
 874                 pr_warn("Unhandled access %d %08llx %d\n", is_write, addr, len);
 875                 return -ENXIO;
 876         }
 877
 878         mmio.phys_addr = addr;
 879         mmio.len = len;
 880         mmio.is_write = is_write;
 881         mmio.data = val;
 882         mmio.private = iodev->redist_vcpu;
 883
 884         spin_lock(&dist->lock);
 885         offset -= range->base;
 886         if (vgic_validate_access(dist, range, offset)) {
 887                 updated_state = call_range_handler(vcpu, &mmio, offset, range);
 888         } else {
 889                 if (!is_write)
 890                         memset(val, 0, len);
 891                 updated_state = false;
 892         }
 893         spin_unlock(&dist->lock);
 894         run->mmio.is_write      = is_write;
 895         run->mmio.len           = len;
 896         run->mmio.phys_addr     = addr;
 897         memcpy(run->mmio.data, val, len);
 898
 899         kvm_handle_mmio_return(vcpu, run);
 900
 901         if (updated_state)
 902                 vgic_kick_vcpus(vcpu->kvm);
 903
 904         return 0;
 905 }
 906
 907 static int vgic_handle_mmio_read(struct kvm_vcpu *vcpu,
 908                                  struct kvm_io_device *this,
 909                                  gpa_t addr, int len, void *val)
 910 {
 911         return vgic_handle_mmio_access(vcpu, this, addr, len, val, false);
 912 }
 913
 914 static int vgic_handle_mmio_write(struct kvm_vcpu *vcpu,
 915                                   struct kvm_io_device *this,
 916                                   gpa_t addr, int len, const void *val)
 917 {
 918         return vgic_handle_mmio_access(vcpu, this, addr, len, (void *)val,
 919                                        true);
 920 }
 921
 922 struct kvm_io_device_ops vgic_io_ops = {
 923         .read   = vgic_handle_mmio_read,
 924         .write  = vgic_handle_mmio_write,
 925 };
 926
 927 /**
 928  * vgic_register_kvm_io_dev - register VGIC register frame on the KVM I/O bus
 929  * @kvm:            The VM structure pointer
 930  * @base:           The (guest) base address for the register frame
 931  * @len:            Length of the register frame window
 932  * @ranges:         Describing the handler functions for each register
 933  * @redist_vcpu_id: The VCPU ID to pass on to the handlers on call
 934  * @iodev:          Points to memory to be passed on to the handler
 935  *
 936  * @iodev stores the parameters of this function to be usable by the handler
 937  * respectively the dispatcher function (since the KVM I/O bus framework lacks
 938  * an opaque parameter). Initialization is done in this function, but the
 939  * reference should be valid and unique for the whole VGIC lifetime.
 940  * If the register frame is not mapped for a specific VCPU, pass -1 to
 941  * @redist_vcpu_id.
 942  */
 943 int vgic_register_kvm_io_dev(struct kvm *kvm, gpa_t base, int len,
 944                              const struct vgic_io_range *ranges,
 945                              int redist_vcpu_id,
 946                              struct vgic_io_device *iodev)
 947 {
 948         struct kvm_vcpu *vcpu = NULL;
 949         int ret;
 950
 951         if (redist_vcpu_id >= 0)
 952                 vcpu = kvm_get_vcpu(kvm, redist_vcpu_id);
 953
 954         iodev->addr             = base;
 955         iodev->len              = len;
 956         iodev->reg_ranges       = ranges;
 957         iodev->redist_vcpu      = vcpu;
 958
 959         kvm_iodevice_init(&iodev->dev, &vgic_io_ops);
 960
 961         mutex_lock(&kvm->slots_lock);
 962
 963         ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, base, len,
 964                                       &iodev->dev);
 965         mutex_unlock(&kvm->slots_lock);
 966
 967         /* Mark the iodev as invalid if registration fails. */
 968         if (ret)
 969                 iodev->dev.ops = NULL;
 970
 971         return ret;
 972 }
 973
 974 static int vgic_nr_shared_irqs(struct vgic_dist *dist)
 975 {
 976         return dist->nr_irqs - VGIC_NR_PRIVATE_IRQS;
 977 }
 978
 979 static int compute_active_for_cpu(struct kvm_vcpu *vcpu)
 980 {
 981         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
 982         unsigned long *active, *enabled, *act_percpu, *act_shared;
 983         unsigned long active_private, active_shared;
 984         int nr_shared = vgic_nr_shared_irqs(dist);
 985         int vcpu_id;
 986
 987         vcpu_id = vcpu->vcpu_id;
 988         act_percpu = vcpu->arch.vgic_cpu.active_percpu;
 989         act_shared = vcpu->arch.vgic_cpu.active_shared;
 990
 991         active = vgic_bitmap_get_cpu_map(&dist->irq_active, vcpu_id);
 992         enabled = vgic_bitmap_get_cpu_map(&dist->irq_enabled, vcpu_id);
 993         bitmap_and(act_percpu, active, enabled, VGIC_NR_PRIVATE_IRQS);
 994
 995         active = vgic_bitmap_get_shared_map(&dist->irq_active);
 996         enabled = vgic_bitmap_get_shared_map(&dist->irq_enabled);
 997         bitmap_and(act_shared, active, enabled, nr_shared);
 998         bitmap_and(act_shared, act_shared,
 999                    vgic_bitmap_get_shared_map(&dist->irq_spi_target[vcpu_id]),
1000                    nr_shared);
1001
1002         active_private = find_first_bit(act_percpu, VGIC_NR_PRIVATE_IRQS);
1003         active_shared = find_first_bit(act_shared, nr_shared);
1004
1005         return (active_private < VGIC_NR_PRIVATE_IRQS ||
1006                 active_shared < nr_shared);
1007 }
1008
1009 static int compute_pending_for_cpu(struct kvm_vcpu *vcpu)
1010 {
1011         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1012         unsigned long *pending, *enabled, *pend_percpu, *pend_shared;
1013         unsigned long pending_private, pending_shared;
1014         int nr_shared = vgic_nr_shared_irqs(dist);
1015         int vcpu_id;
1016
1017         vcpu_id = vcpu->vcpu_id;
1018         pend_percpu = vcpu->arch.vgic_cpu.pending_percpu;
1019         pend_shared = vcpu->arch.vgic_cpu.pending_shared;
1020
1021         if (!dist->enabled) {
1022                 bitmap_zero(pend_percpu, VGIC_NR_PRIVATE_IRQS);
1023                 bitmap_zero(pend_shared, nr_shared);
1024                 return 0;
1025         }
1026
1027         pending = vgic_bitmap_get_cpu_map(&dist->irq_pending, vcpu_id);
1028         enabled = vgic_bitmap_get_cpu_map(&dist->irq_enabled, vcpu_id);
1029         bitmap_and(pend_percpu, pending, enabled, VGIC_NR_PRIVATE_IRQS);
1030
1031         pending = vgic_bitmap_get_shared_map(&dist->irq_pending);
1032         enabled = vgic_bitmap_get_shared_map(&dist->irq_enabled);
1033         bitmap_and(pend_shared, pending, enabled, nr_shared);
1034         bitmap_and(pend_shared, pend_shared,
1035                    vgic_bitmap_get_shared_map(&dist->irq_spi_target[vcpu_id]),
1036                    nr_shared);
1037
1038         pending_private = find_first_bit(pend_percpu, VGIC_NR_PRIVATE_IRQS);
1039         pending_shared = find_first_bit(pend_shared, nr_shared);
1040         return (pending_private < VGIC_NR_PRIVATE_IRQS ||
1041                 pending_shared < vgic_nr_shared_irqs(dist));
1042 }
1043
1044 /*
1045  * Update the interrupt state and determine which CPUs have pending
1046  * or active interrupts. Must be called with distributor lock held.
1047  */
1048 void vgic_update_state(struct kvm *kvm)
1049 {
1050         struct vgic_dist *dist = &kvm->arch.vgic;
1051         struct kvm_vcpu *vcpu;
1052         int c;
1053
1054         kvm_for_each_vcpu(c, vcpu, kvm) {
1055                 if (compute_pending_for_cpu(vcpu))
1056                         set_bit(c, dist->irq_pending_on_cpu);
1057
1058                 if (compute_active_for_cpu(vcpu))
1059                         set_bit(c, dist->irq_active_on_cpu);
1060                 else
1061                         clear_bit(c, dist->irq_active_on_cpu);
1062         }
1063 }
1064
1065 static struct vgic_lr vgic_get_lr(const struct kvm_vcpu *vcpu, int lr)
1066 {
1067         return vgic_ops->get_lr(vcpu, lr);
1068 }
1069
1070 static void vgic_set_lr(struct kvm_vcpu *vcpu, int lr,
1071                                struct vgic_lr vlr)
1072 {
1073         vgic_ops->set_lr(vcpu, lr, vlr);
1074 }
1075
1076 static void vgic_sync_lr_elrsr(struct kvm_vcpu *vcpu, int lr,
1077                                struct vgic_lr vlr)
1078 {
1079         vgic_ops->sync_lr_elrsr(vcpu, lr, vlr);
1080 }
1081
1082 static inline u64 vgic_get_elrsr(struct kvm_vcpu *vcpu)
1083 {
1084         return vgic_ops->get_elrsr(vcpu);
1085 }
1086
1087 static inline u64 vgic_get_eisr(struct kvm_vcpu *vcpu)
1088 {
1089         return vgic_ops->get_eisr(vcpu);
1090 }
1091
1092 static inline void vgic_clear_eisr(struct kvm_vcpu *vcpu)
1093 {
1094         vgic_ops->clear_eisr(vcpu);
1095 }
1096
1097 static inline u32 vgic_get_interrupt_status(struct kvm_vcpu *vcpu)
1098 {
1099         return vgic_ops->get_interrupt_status(vcpu);
1100 }
1101
1102 static inline void vgic_enable_underflow(struct kvm_vcpu *vcpu)
1103 {
1104         vgic_ops->enable_underflow(vcpu);
1105 }
1106
1107 static inline void vgic_disable_underflow(struct kvm_vcpu *vcpu)
1108 {
1109         vgic_ops->disable_underflow(vcpu);
1110 }
1111
1112 void vgic_get_vmcr(struct kvm_vcpu *vcpu, struct vgic_vmcr *vmcr)
1113 {
1114         vgic_ops->get_vmcr(vcpu, vmcr);
1115 }
1116
1117 void vgic_set_vmcr(struct kvm_vcpu *vcpu, struct vgic_vmcr *vmcr)
1118 {
1119         vgic_ops->set_vmcr(vcpu, vmcr);
1120 }
1121
1122 static inline void vgic_enable(struct kvm_vcpu *vcpu)
1123 {
1124         vgic_ops->enable(vcpu);
1125 }
1126
1127 static void vgic_retire_lr(int lr_nr, int irq, struct kvm_vcpu *vcpu)
1128 {
1129         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1130         struct vgic_lr vlr = vgic_get_lr(vcpu, lr_nr);
1131
1132         /*
1133          * We must transfer the pending state back to the distributor before
1134          * retiring the LR, otherwise we may loose edge-triggered interrupts.
1135          */
1136         if (vlr.state & LR_STATE_PENDING) {
1137                 vgic_dist_irq_set_pending(vcpu, irq);
1138                 vlr.hwirq = 0;
1139         }
1140
1141         vlr.state = 0;
1142         vgic_set_lr(vcpu, lr_nr, vlr);
1143         clear_bit(lr_nr, vgic_cpu->lr_used);
1144         vgic_cpu->vgic_irq_lr_map[irq] = LR_EMPTY;
1145         vgic_sync_lr_elrsr(vcpu, lr_nr, vlr);
1146 }
1147
1148 /*
1149  * An interrupt may have been disabled after being made pending on the
1150  * CPU interface (the classic case is a timer running while we're
1151  * rebooting the guest - the interrupt would kick as soon as the CPU
1152  * interface gets enabled, with deadly consequences).
1153  *
1154  * The solution is to examine already active LRs, and check the
1155  * interrupt is still enabled. If not, just retire it.
1156  */
1157 static void vgic_retire_disabled_irqs(struct kvm_vcpu *vcpu)
1158 {
1159         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1160         int lr;
1161
1162         for_each_set_bit(lr, vgic_cpu->lr_used, vgic->nr_lr) {
1163                 struct vgic_lr vlr = vgic_get_lr(vcpu, lr);
1164
1165                 if (!vgic_irq_is_enabled(vcpu, vlr.irq)) {
1166                         vgic_retire_lr(lr, vlr.irq, vcpu);
1167                         if (vgic_irq_is_queued(vcpu, vlr.irq))
1168                                 vgic_irq_clear_queued(vcpu, vlr.irq);
1169                 }
1170         }
1171 }
1172
1173 static void vgic_queue_irq_to_lr(struct kvm_vcpu *vcpu, int irq,
1174                                  int lr_nr, struct vgic_lr vlr)
1175 {
1176         if (vgic_irq_is_active(vcpu, irq)) {
1177                 vlr.state |= LR_STATE_ACTIVE;
1178                 kvm_debug("Set active, clear distributor: 0x%x\n", vlr.state);
1179                 vgic_irq_clear_active(vcpu, irq);
1180                 vgic_update_state(vcpu->kvm);
1181         } else {
1182                 WARN_ON(!vgic_dist_irq_is_pending(vcpu, irq));
1183                 vlr.state |= LR_STATE_PENDING;
1184                 kvm_debug("Set pending: 0x%x\n", vlr.state);
1185         }
1186
1187         if (!vgic_irq_is_edge(vcpu, irq))
1188                 vlr.state |= LR_EOI_INT;
1189
1190         if (vlr.irq >= VGIC_NR_SGIS) {
1191                 struct irq_phys_map *map;
1192                 map = vgic_irq_map_search(vcpu, irq);
1193
1194                 if (map) {
1195                         vlr.hwirq = map->phys_irq;
1196                         vlr.state |= LR_HW;
1197                         vlr.state &= ~LR_EOI_INT;
1198
1199                         /*
1200                          * Make sure we're not going to sample this
1201                          * again, as a HW-backed interrupt cannot be
1202                          * in the PENDING_ACTIVE stage.
1203                          */
1204                         vgic_irq_set_queued(vcpu, irq);
1205                 }
1206         }
1207
1208         vgic_set_lr(vcpu, lr_nr, vlr);
1209         vgic_sync_lr_elrsr(vcpu, lr_nr, vlr);
1210 }
1211
1212 /*
1213  * Queue an interrupt to a CPU virtual interface. Return true on success,
1214  * or false if it wasn't possible to queue it.
1215  * sgi_source must be zero for any non-SGI interrupts.
1216  */
1217 bool vgic_queue_irq(struct kvm_vcpu *vcpu, u8 sgi_source_id, int irq)
1218 {
1219         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1220         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1221         struct vgic_lr vlr;
1222         int lr;
1223
1224         /* Sanitize the input... */
1225         BUG_ON(sgi_source_id & ~7);
1226         BUG_ON(sgi_source_id && irq >= VGIC_NR_SGIS);
1227         BUG_ON(irq >= dist->nr_irqs);
1228
1229         kvm_debug("Queue IRQ%d\n", irq);
1230
1231         lr = vgic_cpu->vgic_irq_lr_map[irq];
1232
1233         /* Do we have an active interrupt for the same CPUID? */
1234         if (lr != LR_EMPTY) {
1235                 vlr = vgic_get_lr(vcpu, lr);
1236                 if (vlr.source == sgi_source_id) {
1237                         kvm_debug("LR%d piggyback for IRQ%d\n", lr, vlr.irq);
1238                         BUG_ON(!test_bit(lr, vgic_cpu->lr_used));
1239                         vgic_queue_irq_to_lr(vcpu, irq, lr, vlr);
1240                         return true;
1241                 }
1242         }
1243
1244         /* Try to use another LR for this interrupt */
1245         lr = find_first_zero_bit((unsigned long *)vgic_cpu->lr_used,
1246                                vgic->nr_lr);
1247         if (lr >= vgic->nr_lr)
1248                 return false;
1249
1250         kvm_debug("LR%d allocated for IRQ%d %x\n", lr, irq, sgi_source_id);
1251         vgic_cpu->vgic_irq_lr_map[irq] = lr;
1252         set_bit(lr, vgic_cpu->lr_used);
1253
1254         vlr.irq = irq;
1255         vlr.source = sgi_source_id;
1256         vlr.state = 0;
1257         vgic_queue_irq_to_lr(vcpu, irq, lr, vlr);
1258
1259         return true;
1260 }
1261
1262 static bool vgic_queue_hwirq(struct kvm_vcpu *vcpu, int irq)
1263 {
1264         if (!vgic_can_sample_irq(vcpu, irq))
1265                 return true; /* level interrupt, already queued */
1266
1267         if (vgic_queue_irq(vcpu, 0, irq)) {
1268                 if (vgic_irq_is_edge(vcpu, irq)) {
1269                         vgic_dist_irq_clear_pending(vcpu, irq);
1270                         vgic_cpu_irq_clear(vcpu, irq);
1271                 } else {
1272                         vgic_irq_set_queued(vcpu, irq);
1273                 }
1274
1275                 return true;
1276         }
1277
1278         return false;
1279 }
1280
1281 /*
1282  * Fill the list registers with pending interrupts before running the
1283  * guest.
1284  */
1285 static void __kvm_vgic_flush_hwstate(struct kvm_vcpu *vcpu)
1286 {
1287         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1288         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1289         unsigned long *pa_percpu, *pa_shared;
1290         int i, vcpu_id;
1291         int overflow = 0;
1292         int nr_shared = vgic_nr_shared_irqs(dist);
1293
1294         vcpu_id = vcpu->vcpu_id;
1295
1296         pa_percpu = vcpu->arch.vgic_cpu.pend_act_percpu;
1297         pa_shared = vcpu->arch.vgic_cpu.pend_act_shared;
1298
1299         bitmap_or(pa_percpu, vgic_cpu->pending_percpu, vgic_cpu->active_percpu,
1300                   VGIC_NR_PRIVATE_IRQS);
1301         bitmap_or(pa_shared, vgic_cpu->pending_shared, vgic_cpu->active_shared,
1302                   nr_shared);
1303         /*
1304          * We may not have any pending interrupt, or the interrupts
1305          * may have been serviced from another vcpu. In all cases,
1306          * move along.
1307          */
1308         if (!kvm_vgic_vcpu_pending_irq(vcpu) && !kvm_vgic_vcpu_active_irq(vcpu))
1309                 goto epilog;
1310
1311         /* SGIs */
1312         for_each_set_bit(i, pa_percpu, VGIC_NR_SGIS) {
1313                 if (!queue_sgi(vcpu, i))
1314                         overflow = 1;
1315         }
1316
1317         /* PPIs */
1318         for_each_set_bit_from(i, pa_percpu, VGIC_NR_PRIVATE_IRQS) {
1319                 if (!vgic_queue_hwirq(vcpu, i))
1320                         overflow = 1;
1321         }
1322
1323         /* SPIs */
1324         for_each_set_bit(i, pa_shared, nr_shared) {
1325                 if (!vgic_queue_hwirq(vcpu, i + VGIC_NR_PRIVATE_IRQS))
1326                         overflow = 1;
1327         }
1328
1329
1330
1331
1332 epilog:
1333         if (overflow) {
1334                 vgic_enable_underflow(vcpu);
1335         } else {
1336                 vgic_disable_underflow(vcpu);
1337                 /*
1338                  * We're about to run this VCPU, and we've consumed
1339                  * everything the distributor had in store for
1340                  * us. Claim we don't have anything pending. We'll
1341                  * adjust that if needed while exiting.
1342                  */
1343                 clear_bit(vcpu_id, dist->irq_pending_on_cpu);
1344         }
1345 }
1346
1347 static int process_level_irq(struct kvm_vcpu *vcpu, int lr, struct vgic_lr vlr)
1348 {
1349         int level_pending = 0;
1350
1351         vlr.state = 0;
1352         vlr.hwirq = 0;
1353         vgic_set_lr(vcpu, lr, vlr);
1354
1355         /*
1356          * If the IRQ was EOIed (called from vgic_process_maintenance) or it
1357          * went from active to non-active (called from vgic_sync_hwirq) it was
1358          * also ACKed and we we therefore assume we can clear the soft pending
1359          * state (should it had been set) for this interrupt.
1360          *
1361          * Note: if the IRQ soft pending state was set after the IRQ was
1362          * acked, it actually shouldn't be cleared, but we have no way of
1363          * knowing that unless we start trapping ACKs when the soft-pending
1364          * state is set.
1365          */
1366         vgic_dist_irq_clear_soft_pend(vcpu, vlr.irq);
1367
1368         /*
1369          * Tell the gic to start sampling the line of this interrupt again.
1370          */
1371         vgic_irq_clear_queued(vcpu, vlr.irq);
1372
1373         /* Any additional pending interrupt? */
1374         if (vgic_dist_irq_get_level(vcpu, vlr.irq)) {
1375                 vgic_cpu_irq_set(vcpu, vlr.irq);
1376                 level_pending = 1;
1377         } else {
1378                 vgic_dist_irq_clear_pending(vcpu, vlr.irq);
1379                 vgic_cpu_irq_clear(vcpu, vlr.irq);
1380         }
1381
1382         /*
1383          * Despite being EOIed, the LR may not have
1384          * been marked as empty.
1385          */
1386         vgic_sync_lr_elrsr(vcpu, lr, vlr);
1387
1388         return level_pending;
1389 }
1390
1391 static bool vgic_process_maintenance(struct kvm_vcpu *vcpu)
1392 {
1393         u32 status = vgic_get_interrupt_status(vcpu);
1394         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1395         struct kvm *kvm = vcpu->kvm;
1396         int level_pending = 0;
1397
1398         kvm_debug("STATUS = %08x\n", status);
1399
1400         if (status & INT_STATUS_EOI) {
1401                 /*
1402                  * Some level interrupts have been EOIed. Clear their
1403                  * active bit.
1404                  */
1405                 u64 eisr = vgic_get_eisr(vcpu);
1406                 unsigned long *eisr_ptr = u64_to_bitmask(&eisr);
1407                 int lr;
1408
1409                 for_each_set_bit(lr, eisr_ptr, vgic->nr_lr) {
1410                         struct vgic_lr vlr = vgic_get_lr(vcpu, lr);
1411
1412                         WARN_ON(vgic_irq_is_edge(vcpu, vlr.irq));
1413                         WARN_ON(vlr.state & LR_STATE_MASK);
1414
1415
1416                         /*
1417                          * kvm_notify_acked_irq calls kvm_set_irq()
1418                          * to reset the IRQ level, which grabs the dist->lock
1419                          * so we call this before taking the dist->lock.
1420                          */
1421                         kvm_notify_acked_irq(kvm, 0,
1422                                              vlr.irq - VGIC_NR_PRIVATE_IRQS);
1423
1424                         spin_lock(&dist->lock);
1425                         level_pending |= process_level_irq(vcpu, lr, vlr);
1426                         spin_unlock(&dist->lock);
1427                 }
1428         }
1429
1430         if (status & INT_STATUS_UNDERFLOW)
1431                 vgic_disable_underflow(vcpu);
1432
1433         /*
1434          * In the next iterations of the vcpu loop, if we sync the vgic state
1435          * after flushing it, but before entering the guest (this happens for
1436          * pending signals and vmid rollovers), then make sure we don't pick
1437          * up any old maintenance interrupts here.
1438          */
1439         vgic_clear_eisr(vcpu);
1440
1441         return level_pending;
1442 }
1443
1444 /*
1445  * Save the physical active state, and reset it to inactive.
1446  *
1447  * Return 1 if HW interrupt went from active to inactive, and 0 otherwise.
1448  */
1449 static int vgic_sync_hwirq(struct kvm_vcpu *vcpu, struct vgic_lr vlr)
1450 {
1451         struct irq_phys_map *map;
1452         int ret;
1453
1454         if (!(vlr.state & LR_HW))
1455                 return 0;
1456
1457         map = vgic_irq_map_search(vcpu, vlr.irq);
1458         BUG_ON(!map);
1459
1460         ret = irq_get_irqchip_state(map->irq,
1461                                     IRQCHIP_STATE_ACTIVE,
1462                                     &map->active);
1463
1464         WARN_ON(ret);
1465
1466         if (map->active)
1467                 return 0;
1468
1469         return 1;
1470 }
1471
1472 /* Sync back the VGIC state after a guest run */
1473 static void __kvm_vgic_sync_hwstate(struct kvm_vcpu *vcpu)
1474 {
1475         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1476         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1477         u64 elrsr;
1478         unsigned long *elrsr_ptr;
1479         int lr, pending;
1480         bool level_pending;
1481
1482         level_pending = vgic_process_maintenance(vcpu);
1483         elrsr = vgic_get_elrsr(vcpu);
1484         elrsr_ptr = u64_to_bitmask(&elrsr);
1485
1486         /* Deal with HW interrupts, and clear mappings for empty LRs */
1487         for (lr = 0; lr < vgic->nr_lr; lr++) {
1488                 struct vgic_lr vlr;
1489
1490                 if (!test_bit(lr, vgic_cpu->lr_used))
1491                         continue;
1492
1493                 vlr = vgic_get_lr(vcpu, lr);
1494                 if (vgic_sync_hwirq(vcpu, vlr)) {
1495                         /*
1496                          * So this is a HW interrupt that the guest
1497                          * EOI-ed. Clean the LR state and allow the
1498                          * interrupt to be sampled again.
1499                          */
1500                         vlr.state = 0;
1501                         vlr.hwirq = 0;
1502                         vgic_set_lr(vcpu, lr, vlr);
1503                         vgic_irq_clear_queued(vcpu, vlr.irq);
1504                         set_bit(lr, elrsr_ptr);
1505                 }
1506
1507                 if (!test_bit(lr, elrsr_ptr))
1508                         continue;
1509
1510                 clear_bit(lr, vgic_cpu->lr_used);
1511
1512                 BUG_ON(vlr.irq >= dist->nr_irqs);
1513                 vgic_cpu->vgic_irq_lr_map[vlr.irq] = LR_EMPTY;
1514         }
1515
1516         /* Check if we still have something up our sleeve... */
1517         pending = find_first_zero_bit(elrsr_ptr, vgic->nr_lr);
1518         if (level_pending || pending < vgic->nr_lr)
1519                 set_bit(vcpu->vcpu_id, dist->irq_pending_on_cpu);
1520 }
1521
1522 void kvm_vgic_flush_hwstate(struct kvm_vcpu *vcpu)
1523 {
1524         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1525
1526         if (!irqchip_in_kernel(vcpu->kvm))
1527                 return;
1528
1529         spin_lock(&dist->lock);
1530         __kvm_vgic_flush_hwstate(vcpu);
1531         spin_unlock(&dist->lock);
1532 }
1533
1534 void kvm_vgic_sync_hwstate(struct kvm_vcpu *vcpu)
1535 {
1536         if (!irqchip_in_kernel(vcpu->kvm))
1537                 return;
1538
1539         __kvm_vgic_sync_hwstate(vcpu);
1540 }
1541
1542 int kvm_vgic_vcpu_pending_irq(struct kvm_vcpu *vcpu)
1543 {
1544         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1545
1546         if (!irqchip_in_kernel(vcpu->kvm))
1547                 return 0;
1548
1549         return test_bit(vcpu->vcpu_id, dist->irq_pending_on_cpu);
1550 }
1551
1552 int kvm_vgic_vcpu_active_irq(struct kvm_vcpu *vcpu)
1553 {
1554         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1555
1556         if (!irqchip_in_kernel(vcpu->kvm))
1557                 return 0;
1558
1559         return test_bit(vcpu->vcpu_id, dist->irq_active_on_cpu);
1560 }
1561
1562
1563 void vgic_kick_vcpus(struct kvm *kvm)
1564 {
1565         struct kvm_vcpu *vcpu;
1566         int c;
1567
1568         /*
1569          * We've injected an interrupt, time to find out who deserves
1570          * a good kick...
1571          */
1572         kvm_for_each_vcpu(c, vcpu, kvm) {
1573                 if (kvm_vgic_vcpu_pending_irq(vcpu))
1574                         kvm_vcpu_kick(vcpu);
1575         }
1576 }
1577
/*
 * Decide whether injecting @irq at @level would change anything.
 *
 * Only inject an interrupt if:
 * - edge triggered and we have a rising edge (@level exceeds the current
 *   pending state)
 * - level triggered and we change level
 *
 * Returns non-zero if the injection should proceed, 0 otherwise.
 */
static int vgic_validate_injection(struct kvm_vcpu *vcpu, int irq, int level)
{
	int state;

	if (vgic_irq_is_edge(vcpu, irq)) {
		state = vgic_dist_irq_is_pending(vcpu, irq);
		return level > state;
	}

	state = vgic_dist_irq_get_level(vcpu, irq);
	return level != state;
}
1595
1596 static int vgic_update_irq_pending(struct kvm *kvm, int cpuid,
1597                                    struct irq_phys_map *map,
1598                                    unsigned int irq_num, bool level)
1599 {
1600         struct vgic_dist *dist = &kvm->arch.vgic;
1601         struct kvm_vcpu *vcpu;
1602         int edge_triggered, level_triggered;
1603         int enabled;
1604         bool ret = true, can_inject = true;
1605
1606         if (irq_num >= min(kvm->arch.vgic.nr_irqs, 1020))
1607                 return -EINVAL;
1608
1609         spin_lock(&dist->lock);
1610
1611         vcpu = kvm_get_vcpu(kvm, cpuid);
1612         edge_triggered = vgic_irq_is_edge(vcpu, irq_num);
1613         level_triggered = !edge_triggered;
1614
1615         if (!vgic_validate_injection(vcpu, irq_num, level)) {
1616                 ret = false;
1617                 goto out;
1618         }
1619
1620         if (irq_num >= VGIC_NR_PRIVATE_IRQS) {
1621                 cpuid = dist->irq_spi_cpu[irq_num - VGIC_NR_PRIVATE_IRQS];
1622                 if (cpuid == VCPU_NOT_ALLOCATED) {
1623                         /* Pretend we use CPU0, and prevent injection */
1624                         cpuid = 0;
1625                         can_inject = false;
1626                 }
1627                 vcpu = kvm_get_vcpu(kvm, cpuid);
1628         }
1629
1630         kvm_debug("Inject IRQ%d level %d CPU%d\n", irq_num, level, cpuid);
1631
1632         if (level) {
1633                 if (level_triggered)
1634                         vgic_dist_irq_set_level(vcpu, irq_num);
1635                 vgic_dist_irq_set_pending(vcpu, irq_num);
1636         } else {
1637                 if (level_triggered) {
1638                         vgic_dist_irq_clear_level(vcpu, irq_num);
1639                         if (!vgic_dist_irq_soft_pend(vcpu, irq_num)) {
1640                                 vgic_dist_irq_clear_pending(vcpu, irq_num);
1641                                 vgic_cpu_irq_clear(vcpu, irq_num);
1642                                 if (!compute_pending_for_cpu(vcpu))
1643                                         clear_bit(cpuid, dist->irq_pending_on_cpu);
1644                         }
1645                 }
1646
1647                 ret = false;
1648                 goto out;
1649         }
1650
1651         enabled = vgic_irq_is_enabled(vcpu, irq_num);
1652
1653         if (!enabled || !can_inject) {
1654                 ret = false;
1655                 goto out;
1656         }
1657
1658         if (!vgic_can_sample_irq(vcpu, irq_num)) {
1659                 /*
1660                  * Level interrupt in progress, will be picked up
1661                  * when EOId.
1662                  */
1663                 ret = false;
1664                 goto out;
1665         }
1666
1667         if (level) {
1668                 vgic_cpu_irq_set(vcpu, irq_num);
1669                 set_bit(cpuid, dist->irq_pending_on_cpu);
1670         }
1671
1672 out:
1673         spin_unlock(&dist->lock);
1674
1675         if (ret) {
1676                 /* kick the specified vcpu */
1677                 kvm_vcpu_kick(kvm_get_vcpu(kvm, cpuid));
1678         }
1679
1680         return 0;
1681 }
1682
1683 static int vgic_lazy_init(struct kvm *kvm)
1684 {
1685         int ret = 0;
1686
1687         if (unlikely(!vgic_initialized(kvm))) {
1688                 /*
1689                  * We only provide the automatic initialization of the VGIC
1690                  * for the legacy case of a GICv2. Any other type must
1691                  * be explicitly initialized once setup with the respective
1692                  * KVM device call.
1693                  */
1694                 if (kvm->arch.vgic.vgic_model != KVM_DEV_TYPE_ARM_VGIC_V2)
1695                         return -EBUSY;
1696
1697                 mutex_lock(&kvm->lock);
1698                 ret = vgic_init(kvm);
1699                 mutex_unlock(&kvm->lock);
1700         }
1701
1702         return ret;
1703 }
1704
1705 /**
1706  * kvm_vgic_inject_irq - Inject an IRQ from a device to the vgic
1707  * @kvm:     The VM structure pointer
1708  * @cpuid:   The CPU for PPIs
1709  * @irq_num: The IRQ number that is assigned to the device. This IRQ
1710  *           must not be mapped to a HW interrupt.
1711  * @level:   Edge-triggered:  true:  to trigger the interrupt
1712  *                            false: to ignore the call
1713  *           Level-sensitive  true:  raise the input signal
1714  *                            false: lower the input signal
1715  *
1716  * The GIC is not concerned with devices being active-LOW or active-HIGH for
1717  * level-sensitive interrupts.  You can think of the level parameter as 1
1718  * being HIGH and 0 being LOW and all devices being active-HIGH.
1719  */
1720 int kvm_vgic_inject_irq(struct kvm *kvm, int cpuid, unsigned int irq_num,
1721                         bool level)
1722 {
1723         struct irq_phys_map *map;
1724         int ret;
1725
1726         ret = vgic_lazy_init(kvm);
1727         if (ret)
1728                 return ret;
1729
1730         map = vgic_irq_map_search(kvm_get_vcpu(kvm, cpuid), irq_num);
1731         if (map)
1732                 return -EINVAL;
1733
1734         return vgic_update_irq_pending(kvm, cpuid, NULL, irq_num, level);
1735 }
1736
1737 /**
1738  * kvm_vgic_inject_mapped_irq - Inject a physically mapped IRQ to the vgic
1739  * @kvm:     The VM structure pointer
1740  * @cpuid:   The CPU for PPIs
1741  * @map:     Pointer to a irq_phys_map structure describing the mapping
1742  * @level:   Edge-triggered:  true:  to trigger the interrupt
1743  *                            false: to ignore the call
1744  *           Level-sensitive  true:  raise the input signal
1745  *                            false: lower the input signal
1746  *
1747  * The GIC is not concerned with devices being active-LOW or active-HIGH for
1748  * level-sensitive interrupts.  You can think of the level parameter as 1
1749  * being HIGH and 0 being LOW and all devices being active-HIGH.
1750  */
1751 int kvm_vgic_inject_mapped_irq(struct kvm *kvm, int cpuid,
1752                                struct irq_phys_map *map, bool level)
1753 {
1754         int ret;
1755
1756         ret = vgic_lazy_init(kvm);
1757         if (ret)
1758                 return ret;
1759
1760         return vgic_update_irq_pending(kvm, cpuid, map, map->virt_irq, level);
1761 }
1762
1763 static irqreturn_t vgic_maintenance_handler(int irq, void *data)
1764 {
1765         /*
1766          * We cannot rely on the vgic maintenance interrupt to be
1767          * delivered synchronously. This means we can only use it to
1768          * exit the VM, and we perform the handling of EOIed
1769          * interrupts on the exit path (see vgic_process_maintenance).
1770          */
1771         return IRQ_HANDLED;
1772 }
1773
1774 static struct list_head *vgic_get_irq_phys_map_list(struct kvm_vcpu *vcpu,
1775                                                     int virt_irq)
1776 {
1777         if (virt_irq < VGIC_NR_PRIVATE_IRQS)
1778                 return &vcpu->arch.vgic_cpu.irq_phys_map_list;
1779         else
1780                 return &vcpu->kvm->arch.vgic.irq_phys_map_list;
1781 }
1782
1783 /**
1784  * kvm_vgic_map_phys_irq - map a virtual IRQ to a physical IRQ
1785  * @vcpu: The VCPU pointer
1786  * @virt_irq: The virtual irq number
1787  * @irq: The Linux IRQ number
1788  *
1789  * Establish a mapping between a guest visible irq (@virt_irq) and a
1790  * Linux irq (@irq). On injection, @virt_irq will be associated with
1791  * the physical interrupt represented by @irq. This mapping can be
1792  * established multiple times as long as the parameters are the same.
1793  *
1794  * Returns a valid pointer on success, and an error pointer otherwise
1795  */
1796 struct irq_phys_map *kvm_vgic_map_phys_irq(struct kvm_vcpu *vcpu,
1797                                            int virt_irq, int irq)
1798 {
1799         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1800         struct list_head *root = vgic_get_irq_phys_map_list(vcpu, virt_irq);
1801         struct irq_phys_map *map;
1802         struct irq_phys_map_entry *entry;
1803         struct irq_desc *desc;
1804         struct irq_data *data;
1805         int phys_irq;
1806
1807         desc = irq_to_desc(irq);
1808         if (!desc) {
1809                 kvm_err("%s: no interrupt descriptor\n", __func__);
1810                 return ERR_PTR(-EINVAL);
1811         }
1812
1813         data = irq_desc_get_irq_data(desc);
1814         while (data->parent_data)
1815                 data = data->parent_data;
1816
1817         phys_irq = data->hwirq;
1818
1819         /* Create a new mapping */
1820         entry = kzalloc(sizeof(*entry), GFP_KERNEL);
1821         if (!entry)
1822                 return ERR_PTR(-ENOMEM);
1823
1824         spin_lock(&dist->irq_phys_map_lock);
1825
1826         /* Try to match an existing mapping */
1827         map = vgic_irq_map_search(vcpu, virt_irq);
1828         if (map) {
1829                 /* Make sure this mapping matches */
1830                 if (map->phys_irq != phys_irq   ||
1831                     map->irq      != irq)
1832                         map = ERR_PTR(-EINVAL);
1833
1834                 /* Found an existing, valid mapping */
1835                 goto out;
1836         }
1837
1838         map           = &entry->map;
1839         map->virt_irq = virt_irq;
1840         map->phys_irq = phys_irq;
1841         map->irq      = irq;
1842
1843         list_add_tail_rcu(&entry->entry, root);
1844
1845 out:
1846         spin_unlock(&dist->irq_phys_map_lock);
1847         /* If we've found a hit in the existing list, free the useless
1848          * entry */
1849         if (IS_ERR(map) || map != &entry->map)
1850                 kfree(entry);
1851         return map;
1852 }
1853
1854 static struct irq_phys_map *vgic_irq_map_search(struct kvm_vcpu *vcpu,
1855                                                 int virt_irq)
1856 {
1857         struct list_head *root = vgic_get_irq_phys_map_list(vcpu, virt_irq);
1858         struct irq_phys_map_entry *entry;
1859         struct irq_phys_map *map;
1860
1861         rcu_read_lock();
1862
1863         list_for_each_entry_rcu(entry, root, entry) {
1864                 map = &entry->map;
1865                 if (map->virt_irq == virt_irq) {
1866                         rcu_read_unlock();
1867                         return map;
1868                 }
1869         }
1870
1871         rcu_read_unlock();
1872
1873         return NULL;
1874 }
1875
1876 static void vgic_free_phys_irq_map_rcu(struct rcu_head *rcu)
1877 {
1878         struct irq_phys_map_entry *entry;
1879
1880         entry = container_of(rcu, struct irq_phys_map_entry, rcu);
1881         kfree(entry);
1882 }
1883
1884 /**
1885  * kvm_vgic_get_phys_irq_active - Return the active state of a mapped IRQ
1886  *
1887  * Return the logical active state of a mapped interrupt. This doesn't
1888  * necessarily reflects the current HW state.
1889  */
1890 bool kvm_vgic_get_phys_irq_active(struct irq_phys_map *map)
1891 {
1892         BUG_ON(!map);
1893         return map->active;
1894 }
1895
1896 /**
1897  * kvm_vgic_set_phys_irq_active - Set the active state of a mapped IRQ
1898  *
1899  * Set the logical active state of a mapped interrupt. This doesn't
1900  * immediately affects the HW state.
1901  */
1902 void kvm_vgic_set_phys_irq_active(struct irq_phys_map *map, bool active)
1903 {
1904         BUG_ON(!map);
1905         map->active = active;
1906 }
1907
1908 /**
1909  * kvm_vgic_unmap_phys_irq - Remove a virtual to physical IRQ mapping
1910  * @vcpu: The VCPU pointer
1911  * @map: The pointer to a mapping obtained through kvm_vgic_map_phys_irq
1912  *
1913  * Remove an existing mapping between virtual and physical interrupts.
1914  */
1915 int kvm_vgic_unmap_phys_irq(struct kvm_vcpu *vcpu, struct irq_phys_map *map)
1916 {
1917         struct vgic_dist *dist = &vcpu->kvm->arch.vgic;
1918         struct irq_phys_map_entry *entry;
1919         struct list_head *root;
1920
1921         if (!map)
1922                 return -EINVAL;
1923
1924         root = vgic_get_irq_phys_map_list(vcpu, map->virt_irq);
1925
1926         spin_lock(&dist->irq_phys_map_lock);
1927
1928         list_for_each_entry(entry, root, entry) {
1929                 if (&entry->map == map) {
1930                         list_del_rcu(&entry->entry);
1931                         call_rcu(&entry->rcu, vgic_free_phys_irq_map_rcu);
1932                         break;
1933                 }
1934         }
1935
1936         spin_unlock(&dist->irq_phys_map_lock);
1937
1938         return 0;
1939 }
1940
1941 static void vgic_destroy_irq_phys_map(struct kvm *kvm, struct list_head *root)
1942 {
1943         struct vgic_dist *dist = &kvm->arch.vgic;
1944         struct irq_phys_map_entry *entry;
1945
1946         spin_lock(&dist->irq_phys_map_lock);
1947
1948         list_for_each_entry(entry, root, entry) {
1949                 list_del_rcu(&entry->entry);
1950                 call_rcu(&entry->rcu, vgic_free_phys_irq_map_rcu);
1951         }
1952
1953         spin_unlock(&dist->irq_phys_map_lock);
1954 }
1955
1956 void kvm_vgic_vcpu_destroy(struct kvm_vcpu *vcpu)
1957 {
1958         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1959
1960         kfree(vgic_cpu->pending_shared);
1961         kfree(vgic_cpu->active_shared);
1962         kfree(vgic_cpu->pend_act_shared);
1963         kfree(vgic_cpu->vgic_irq_lr_map);
1964         vgic_destroy_irq_phys_map(vcpu->kvm, &vgic_cpu->irq_phys_map_list);
1965         vgic_cpu->pending_shared = NULL;
1966         vgic_cpu->active_shared = NULL;
1967         vgic_cpu->pend_act_shared = NULL;
1968         vgic_cpu->vgic_irq_lr_map = NULL;
1969 }
1970
1971 static int vgic_vcpu_init_maps(struct kvm_vcpu *vcpu, int nr_irqs)
1972 {
1973         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
1974
1975         int sz = (nr_irqs - VGIC_NR_PRIVATE_IRQS) / 8;
1976         vgic_cpu->pending_shared = kzalloc(sz, GFP_KERNEL);
1977         vgic_cpu->active_shared = kzalloc(sz, GFP_KERNEL);
1978         vgic_cpu->pend_act_shared = kzalloc(sz, GFP_KERNEL);
1979         vgic_cpu->vgic_irq_lr_map = kmalloc(nr_irqs, GFP_KERNEL);
1980
1981         if (!vgic_cpu->pending_shared
1982                 || !vgic_cpu->active_shared
1983                 || !vgic_cpu->pend_act_shared
1984                 || !vgic_cpu->vgic_irq_lr_map) {
1985                 kvm_vgic_vcpu_destroy(vcpu);
1986                 return -ENOMEM;
1987         }
1988
1989         memset(vgic_cpu->vgic_irq_lr_map, LR_EMPTY, nr_irqs);
1990
1991         /*
1992          * Store the number of LRs per vcpu, so we don't have to go
1993          * all the way to the distributor structure to find out. Only
1994          * assembly code should use this one.
1995          */
1996         vgic_cpu->nr_lr = vgic->nr_lr;
1997
1998         return 0;
1999 }
2000
2001 /**
2002  * kvm_vgic_vcpu_early_init - Earliest possible per-vcpu vgic init stage
2003  *
2004  * No memory allocation should be performed here, only static init.
2005  */
2006 void kvm_vgic_vcpu_early_init(struct kvm_vcpu *vcpu)
2007 {
2008         struct vgic_cpu *vgic_cpu = &vcpu->arch.vgic_cpu;
2009         INIT_LIST_HEAD(&vgic_cpu->irq_phys_map_list);
2010 }
2011
2012 /**
2013  * kvm_vgic_get_max_vcpus - Get the maximum number of VCPUs allowed by HW
2014  *
2015  * The host's GIC naturally limits the maximum amount of VCPUs a guest
2016  * can use.
2017  */
2018 int kvm_vgic_get_max_vcpus(void)
2019 {
2020         return vgic->max_gic_vcpus;
2021 }
2022
2023 void kvm_vgic_destroy(struct kvm *kvm)
2024 {
2025         struct vgic_dist *dist = &kvm->arch.vgic;
2026         struct kvm_vcpu *vcpu;
2027         int i;
2028
2029         kvm_for_each_vcpu(i, vcpu, kvm)
2030                 kvm_vgic_vcpu_destroy(vcpu);
2031
2032         vgic_free_bitmap(&dist->irq_enabled);
2033         vgic_free_bitmap(&dist->irq_level);
2034         vgic_free_bitmap(&dist->irq_pending);
2035         vgic_free_bitmap(&dist->irq_soft_pend);
2036         vgic_free_bitmap(&dist->irq_queued);
2037         vgic_free_bitmap(&dist->irq_cfg);
2038         vgic_free_bytemap(&dist->irq_priority);
2039         if (dist->irq_spi_target) {
2040                 for (i = 0; i < dist->nr_cpus; i++)
2041                         vgic_free_bitmap(&dist->irq_spi_target[i]);
2042         }
2043         kfree(dist->irq_sgi_sources);
2044         kfree(dist->irq_spi_cpu);
2045         kfree(dist->irq_spi_mpidr);
2046         kfree(dist->irq_spi_target);
2047         kfree(dist->irq_pending_on_cpu);
2048         kfree(dist->irq_active_on_cpu);
2049         vgic_destroy_irq_phys_map(kvm, &dist->irq_phys_map_list);
2050         dist->irq_sgi_sources = NULL;
2051         dist->irq_spi_cpu = NULL;
2052         dist->irq_spi_target = NULL;
2053         dist->irq_pending_on_cpu = NULL;
2054         dist->irq_active_on_cpu = NULL;
2055         dist->nr_cpus = 0;
2056 }
2057
2058 /*
2059  * Allocate and initialize the various data structures. Must be called
2060  * with kvm->lock held!
2061  */
2062 int vgic_init(struct kvm *kvm)
2063 {
2064         struct vgic_dist *dist = &kvm->arch.vgic;
2065         struct kvm_vcpu *vcpu;
2066         int nr_cpus, nr_irqs;
2067         int ret, i, vcpu_id;
2068
2069         if (vgic_initialized(kvm))
2070                 return 0;
2071
2072         nr_cpus = dist->nr_cpus = atomic_read(&kvm->online_vcpus);
2073         if (!nr_cpus)           /* No vcpus? Can't be good... */
2074                 return -ENODEV;
2075
2076         /*
2077          * If nobody configured the number of interrupts, use the
2078          * legacy one.
2079          */
2080         if (!dist->nr_irqs)
2081                 dist->nr_irqs = VGIC_NR_IRQS_LEGACY;
2082
2083         nr_irqs = dist->nr_irqs;
2084
2085         ret  = vgic_init_bitmap(&dist->irq_enabled, nr_cpus, nr_irqs);
2086         ret |= vgic_init_bitmap(&dist->irq_level, nr_cpus, nr_irqs);
2087         ret |= vgic_init_bitmap(&dist->irq_pending, nr_cpus, nr_irqs);
2088         ret |= vgic_init_bitmap(&dist->irq_soft_pend, nr_cpus, nr_irqs);
2089         ret |= vgic_init_bitmap(&dist->irq_queued, nr_cpus, nr_irqs);
2090         ret |= vgic_init_bitmap(&dist->irq_active, nr_cpus, nr_irqs);
2091         ret |= vgic_init_bitmap(&dist->irq_cfg, nr_cpus, nr_irqs);
2092         ret |= vgic_init_bytemap(&dist->irq_priority, nr_cpus, nr_irqs);
2093
2094         if (ret)
2095                 goto out;
2096
2097         dist->irq_sgi_sources = kzalloc(nr_cpus * VGIC_NR_SGIS, GFP_KERNEL);
2098         dist->irq_spi_cpu = kzalloc(nr_irqs - VGIC_NR_PRIVATE_IRQS, GFP_KERNEL);
2099         dist->irq_spi_target = kzalloc(sizeof(*dist->irq_spi_target) * nr_cpus,
2100                                        GFP_KERNEL);
2101         dist->irq_pending_on_cpu = kzalloc(BITS_TO_LONGS(nr_cpus) * sizeof(long),
2102                                            GFP_KERNEL);
2103         dist->irq_active_on_cpu = kzalloc(BITS_TO_LONGS(nr_cpus) * sizeof(long),
2104                                            GFP_KERNEL);
2105         if (!dist->irq_sgi_sources ||
2106             !dist->irq_spi_cpu ||
2107             !dist->irq_spi_target ||
2108             !dist->irq_pending_on_cpu ||
2109             !dist->irq_active_on_cpu) {
2110                 ret = -ENOMEM;
2111                 goto out;
2112         }
2113
2114         for (i = 0; i < nr_cpus; i++)
2115                 ret |= vgic_init_bitmap(&dist->irq_spi_target[i],
2116                                         nr_cpus, nr_irqs);
2117
2118         if (ret)
2119                 goto out;
2120
2121         ret = kvm->arch.vgic.vm_ops.init_model(kvm);
2122         if (ret)
2123                 goto out;
2124
2125         kvm_for_each_vcpu(vcpu_id, vcpu, kvm) {
2126                 ret = vgic_vcpu_init_maps(vcpu, nr_irqs);
2127                 if (ret) {
2128                         kvm_err("VGIC: Failed to allocate vcpu memory\n");
2129                         break;
2130                 }
2131
2132                 for (i = 0; i < dist->nr_irqs; i++) {
2133                         if (i < VGIC_NR_PPIS)
2134                                 vgic_bitmap_set_irq_val(&dist->irq_enabled,
2135                                                         vcpu->vcpu_id, i, 1);
2136                         if (i < VGIC_NR_PRIVATE_IRQS)
2137                                 vgic_bitmap_set_irq_val(&dist->irq_cfg,
2138                                                         vcpu->vcpu_id, i,
2139                                                         VGIC_CFG_EDGE);
2140                 }
2141
2142                 vgic_enable(vcpu);
2143         }
2144
2145 out:
2146         if (ret)
2147                 kvm_vgic_destroy(kvm);
2148
2149         return ret;
2150 }
2151
2152 static int init_vgic_model(struct kvm *kvm, int type)
2153 {
2154         switch (type) {
2155         case KVM_DEV_TYPE_ARM_VGIC_V2:
2156                 vgic_v2_init_emulation(kvm);
2157                 break;
2158 #ifdef CONFIG_ARM_GIC_V3
2159         case KVM_DEV_TYPE_ARM_VGIC_V3:
2160                 vgic_v3_init_emulation(kvm);
2161                 break;
2162 #endif
2163         default:
2164                 return -ENODEV;
2165         }
2166
2167         if (atomic_read(&kvm->online_vcpus) > kvm->arch.max_vcpus)
2168                 return -E2BIG;
2169
2170         return 0;
2171 }
2172
2173 /**
2174  * kvm_vgic_early_init - Earliest possible vgic initialization stage
2175  *
2176  * No memory allocation should be performed here, only static init.
2177  */
2178 void kvm_vgic_early_init(struct kvm *kvm)
2179 {
2180         spin_lock_init(&kvm->arch.vgic.lock);
2181         spin_lock_init(&kvm->arch.vgic.irq_phys_map_lock);
2182         INIT_LIST_HEAD(&kvm->arch.vgic.irq_phys_map_list);
2183 }
2184
2185 int kvm_vgic_create(struct kvm *kvm, u32 type)
2186 {
2187         int i, vcpu_lock_idx = -1, ret;
2188         struct kvm_vcpu *vcpu;
2189
2190         mutex_lock(&kvm->lock);
2191
2192         if (irqchip_in_kernel(kvm)) {
2193                 ret = -EEXIST;
2194                 goto out;
2195         }
2196
2197         /*
2198          * This function is also called by the KVM_CREATE_IRQCHIP handler,
2199          * which had no chance yet to check the availability of the GICv2
2200          * emulation. So check this here again. KVM_CREATE_DEVICE does
2201          * the proper checks already.
2202          */
2203         if (type == KVM_DEV_TYPE_ARM_VGIC_V2 && !vgic->can_emulate_gicv2) {
2204                 ret = -ENODEV;
2205                 goto out;
2206         }
2207
2208         /*
2209          * Any time a vcpu is run, vcpu_load is called which tries to grab the
2210          * vcpu->mutex.  By grabbing the vcpu->mutex of all VCPUs we ensure
2211          * that no other VCPUs are run while we create the vgic.
2212          */
2213         ret = -EBUSY;
2214         kvm_for_each_vcpu(i, vcpu, kvm) {
2215                 if (!mutex_trylock(&vcpu->mutex))
2216                         goto out_unlock;
2217                 vcpu_lock_idx = i;
2218         }
2219
2220         kvm_for_each_vcpu(i, vcpu, kvm) {
2221                 if (vcpu->arch.has_run_once)
2222                         goto out_unlock;
2223         }
2224         ret = 0;
2225
2226         ret = init_vgic_model(kvm, type);
2227         if (ret)
2228                 goto out_unlock;
2229
2230         kvm->arch.vgic.in_kernel = true;
2231         kvm->arch.vgic.vgic_model = type;
2232         kvm->arch.vgic.vctrl_base = vgic->vctrl_base;
2233         kvm->arch.vgic.vgic_dist_base = VGIC_ADDR_UNDEF;
2234         kvm->arch.vgic.vgic_cpu_base = VGIC_ADDR_UNDEF;
2235         kvm->arch.vgic.vgic_redist_base = VGIC_ADDR_UNDEF;
2236
2237 out_unlock:
2238         for (; vcpu_lock_idx >= 0; vcpu_lock_idx--) {
2239                 vcpu = kvm_get_vcpu(kvm, vcpu_lock_idx);
2240                 mutex_unlock(&vcpu->mutex);
2241         }
2242
2243 out:
2244         mutex_unlock(&kvm->lock);
2245         return ret;
2246 }
2247
2248 static int vgic_ioaddr_overlap(struct kvm *kvm)
2249 {
2250         phys_addr_t dist = kvm->arch.vgic.vgic_dist_base;
2251         phys_addr_t cpu = kvm->arch.vgic.vgic_cpu_base;
2252
2253         if (IS_VGIC_ADDR_UNDEF(dist) || IS_VGIC_ADDR_UNDEF(cpu))
2254                 return 0;
2255         if ((dist <= cpu && dist + KVM_VGIC_V2_DIST_SIZE > cpu) ||
2256             (cpu <= dist && cpu + KVM_VGIC_V2_CPU_SIZE > dist))
2257                 return -EBUSY;
2258         return 0;
2259 }
2260
2261 static int vgic_ioaddr_assign(struct kvm *kvm, phys_addr_t *ioaddr,
2262                               phys_addr_t addr, phys_addr_t size)
2263 {
2264         int ret;
2265
2266         if (addr & ~KVM_PHYS_MASK)
2267                 return -E2BIG;
2268
2269         if (addr & (SZ_4K - 1))
2270                 return -EINVAL;
2271
2272         if (!IS_VGIC_ADDR_UNDEF(*ioaddr))
2273                 return -EEXIST;
2274         if (addr + size < addr)
2275                 return -EINVAL;
2276
2277         *ioaddr = addr;
2278         ret = vgic_ioaddr_overlap(kvm);
2279         if (ret)
2280                 *ioaddr = VGIC_ADDR_UNDEF;
2281
2282         return ret;
2283 }
2284
2285 /**
2286  * kvm_vgic_addr - set or get vgic VM base addresses
2287  * @kvm:   pointer to the vm struct
2288  * @type:  the VGIC addr type, one of KVM_VGIC_V[23]_ADDR_TYPE_XXX
2289  * @addr:  pointer to address value
2290  * @write: if true set the address in the VM address space, if false read the
2291  *          address
2292  *
2293  * Set or get the vgic base addresses for the distributor and the virtual CPU
2294  * interface in the VM physical address space.  These addresses are properties
2295  * of the emulated core/SoC and therefore user space initially knows this
2296  * information.
2297  */
2298 int kvm_vgic_addr(struct kvm *kvm, unsigned long type, u64 *addr, bool write)
2299 {
2300         int r = 0;
2301         struct vgic_dist *vgic = &kvm->arch.vgic;
2302         int type_needed;
2303         phys_addr_t *addr_ptr, block_size;
2304         phys_addr_t alignment;
2305
2306         mutex_lock(&kvm->lock);
2307         switch (type) {
2308         case KVM_VGIC_V2_ADDR_TYPE_DIST:
2309                 type_needed = KVM_DEV_TYPE_ARM_VGIC_V2;
2310                 addr_ptr = &vgic->vgic_dist_base;
2311                 block_size = KVM_VGIC_V2_DIST_SIZE;
2312                 alignment = SZ_4K;
2313                 break;
2314         case KVM_VGIC_V2_ADDR_TYPE_CPU:
2315                 type_needed = KVM_DEV_TYPE_ARM_VGIC_V2;
2316                 addr_ptr = &vgic->vgic_cpu_base;
2317                 block_size = KVM_VGIC_V2_CPU_SIZE;
2318                 alignment = SZ_4K;
2319                 break;
2320 #ifdef CONFIG_ARM_GIC_V3
2321         case KVM_VGIC_V3_ADDR_TYPE_DIST:
2322                 type_needed = KVM_DEV_TYPE_ARM_VGIC_V3;
2323                 addr_ptr = &vgic->vgic_dist_base;
2324                 block_size = KVM_VGIC_V3_DIST_SIZE;
2325                 alignment = SZ_64K;
2326                 break;
2327         case KVM_VGIC_V3_ADDR_TYPE_REDIST:
2328                 type_needed = KVM_DEV_TYPE_ARM_VGIC_V3;
2329                 addr_ptr = &vgic->vgic_redist_base;
2330                 block_size = KVM_VGIC_V3_REDIST_SIZE;
2331                 alignment = SZ_64K;
2332                 break;
2333 #endif
2334         default:
2335                 r = -ENODEV;
2336                 goto out;
2337         }
2338
2339         if (vgic->vgic_model != type_needed) {
2340                 r = -ENODEV;
2341                 goto out;
2342         }
2343
2344         if (write) {
2345                 if (!IS_ALIGNED(*addr, alignment))
2346                         r = -EINVAL;
2347                 else
2348                         r = vgic_ioaddr_assign(kvm, addr_ptr, *addr,
2349                                                block_size);
2350         } else {
2351                 *addr = *addr_ptr;
2352         }
2353
2354 out:
2355         mutex_unlock(&kvm->lock);
2356         return r;
2357 }
2358
2359 int vgic_set_common_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
2360 {
2361         int r;
2362
2363         switch (attr->group) {
2364         case KVM_DEV_ARM_VGIC_GRP_ADDR: {
2365                 u64 __user *uaddr = (u64 __user *)(long)attr->addr;
2366                 u64 addr;
2367                 unsigned long type = (unsigned long)attr->attr;
2368
2369                 if (copy_from_user(&addr, uaddr, sizeof(addr)))
2370                         return -EFAULT;
2371
2372                 r = kvm_vgic_addr(dev->kvm, type, &addr, true);
2373                 return (r == -ENODEV) ? -ENXIO : r;
2374         }
2375         case KVM_DEV_ARM_VGIC_GRP_NR_IRQS: {
2376                 u32 __user *uaddr = (u32 __user *)(long)attr->addr;
2377                 u32 val;
2378                 int ret = 0;
2379
2380                 if (get_user(val, uaddr))
2381                         return -EFAULT;
2382
2383                 /*
2384                  * We require:
2385                  * - at least 32 SPIs on top of the 16 SGIs and 16 PPIs
2386                  * - at most 1024 interrupts
2387                  * - a multiple of 32 interrupts
2388                  */
2389                 if (val < (VGIC_NR_PRIVATE_IRQS + 32) ||
2390                     val > VGIC_MAX_IRQS ||
2391                     (val & 31))
2392                         return -EINVAL;
2393
2394                 mutex_lock(&dev->kvm->lock);
2395
2396                 if (vgic_ready(dev->kvm) || dev->kvm->arch.vgic.nr_irqs)
2397                         ret = -EBUSY;
2398                 else
2399                         dev->kvm->arch.vgic.nr_irqs = val;
2400
2401                 mutex_unlock(&dev->kvm->lock);
2402
2403                 return ret;
2404         }
2405         case KVM_DEV_ARM_VGIC_GRP_CTRL: {
2406                 switch (attr->attr) {
2407                 case KVM_DEV_ARM_VGIC_CTRL_INIT:
2408                         r = vgic_init(dev->kvm);
2409                         return r;
2410                 }
2411                 break;
2412         }
2413         }
2414
2415         return -ENXIO;
2416 }
2417
2418 int vgic_get_common_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
2419 {
2420         int r = -ENXIO;
2421
2422         switch (attr->group) {
2423         case KVM_DEV_ARM_VGIC_GRP_ADDR: {
2424                 u64 __user *uaddr = (u64 __user *)(long)attr->addr;
2425                 u64 addr;
2426                 unsigned long type = (unsigned long)attr->attr;
2427
2428                 r = kvm_vgic_addr(dev->kvm, type, &addr, false);
2429                 if (r)
2430                         return (r == -ENODEV) ? -ENXIO : r;
2431
2432                 if (copy_to_user(uaddr, &addr, sizeof(addr)))
2433                         return -EFAULT;
2434                 break;
2435         }
2436         case KVM_DEV_ARM_VGIC_GRP_NR_IRQS: {
2437                 u32 __user *uaddr = (u32 __user *)(long)attr->addr;
2438
2439                 r = put_user(dev->kvm->arch.vgic.nr_irqs, uaddr);
2440                 break;
2441         }
2442
2443         }
2444
2445         return r;
2446 }
2447
2448 int vgic_has_attr_regs(const struct vgic_io_range *ranges, phys_addr_t offset)
2449 {
2450         if (vgic_find_range(ranges, 4, offset))
2451                 return 0;
2452         else
2453                 return -ENXIO;
2454 }
2455
2456 static void vgic_init_maintenance_interrupt(void *info)
2457 {
2458         enable_percpu_irq(vgic->maint_irq, 0);
2459 }
2460
2461 static int vgic_cpu_notify(struct notifier_block *self,
2462                            unsigned long action, void *cpu)
2463 {
2464         switch (action) {
2465         case CPU_STARTING:
2466         case CPU_STARTING_FROZEN:
2467                 vgic_init_maintenance_interrupt(NULL);
2468                 break;
2469         case CPU_DYING:
2470         case CPU_DYING_FROZEN:
2471                 disable_percpu_irq(vgic->maint_irq);
2472                 break;
2473         }
2474
2475         return NOTIFY_OK;
2476 }
2477
2478 static struct notifier_block vgic_cpu_nb = {
2479         .notifier_call = vgic_cpu_notify,
2480 };
2481
2482 static const struct of_device_id vgic_ids[] = {
2483         { .compatible = "arm,cortex-a15-gic",   .data = vgic_v2_probe, },
2484         { .compatible = "arm,cortex-a7-gic",    .data = vgic_v2_probe, },
2485         { .compatible = "arm,gic-400",          .data = vgic_v2_probe, },
2486         { .compatible = "arm,gic-v3",           .data = vgic_v3_probe, },
2487         {},
2488 };
2489
2490 int kvm_vgic_hyp_init(void)
2491 {
2492         const struct of_device_id *matched_id;
2493         const int (*vgic_probe)(struct device_node *,const struct vgic_ops **,
2494                                 const struct vgic_params **);
2495         struct device_node *vgic_node;
2496         int ret;
2497
2498         vgic_node = of_find_matching_node_and_match(NULL,
2499                                                     vgic_ids, &matched_id);
2500         if (!vgic_node) {
2501                 kvm_err("error: no compatible GIC node found\n");
2502                 return -ENODEV;
2503         }
2504
2505         vgic_probe = matched_id->data;
2506         ret = vgic_probe(vgic_node, &vgic_ops, &vgic);
2507         if (ret)
2508                 return ret;
2509
2510         ret = request_percpu_irq(vgic->maint_irq, vgic_maintenance_handler,
2511                                  "vgic", kvm_get_running_vcpus());
2512         if (ret) {
2513                 kvm_err("Cannot register interrupt %d\n", vgic->maint_irq);
2514                 return ret;
2515         }
2516
2517         ret = __register_cpu_notifier(&vgic_cpu_nb);
2518         if (ret) {
2519                 kvm_err("Cannot register vgic CPU notifier\n");
2520                 goto out_free_irq;
2521         }
2522
2523         on_each_cpu(vgic_init_maintenance_interrupt, NULL, 1);
2524
2525         return 0;
2526
2527 out_free_irq:
2528         free_percpu_irq(vgic->maint_irq, kvm_get_running_vcpus());
2529         return ret;
2530 }
2531
/*
 * Stub: no routing entries are filled in for @gsi. Always returns 0.
 */
int kvm_irq_map_gsi(struct kvm *kvm,
                    struct kvm_kernel_irq_routing_entry *entries,
                    int gsi)
{
        const int nr_entries = 0;

        return nr_entries;
}
2538
/*
 * Identity mapping: the returned value is @pin itself, whatever
 * @irqchip is.
 */
int kvm_irq_map_chip_pin(struct kvm *kvm, unsigned irqchip, unsigned pin)
{
        int mapped = pin;

        return mapped;
}
2543
2544 int kvm_set_irq(struct kvm *kvm, int irq_source_id,
2545                 u32 irq, int level, bool line_status)
2546 {
2547         unsigned int spi = irq + VGIC_NR_PRIVATE_IRQS;
2548
2549         trace_kvm_set_irq(irq, level, irq_source_id);
2550
2551         BUG_ON(!vgic_initialized(kvm));
2552
2553         return kvm_vgic_inject_irq(kvm, 0, spi, level);
2554 }
2555
/*
 * MSI not implemented yet: every argument is ignored and 0 is returned.
 */
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e,
                struct kvm *kvm, int irq_source_id,
                int level, bool line_status)
{
        const int ret = 0;

        return ret;
}